diff --git a/api/docker/entrypoint.sh b/api/docker/entrypoint.sh
index 67723ca592..68f3c65a4b 100755
--- a/api/docker/entrypoint.sh
+++ b/api/docker/entrypoint.sh
@@ -2,12 +2,6 @@
set -e
-if [[ "${MODE}" == "copy" ]]; then
- mkdir -p /app/storage
- cp -rf /app/api/init_data/plugins/storage/* /app/storage/
- exit 0
-fi
-
if [[ "${MIGRATION_ENABLED}" == "true" ]]; then
echo "Running migrations"
flask upgrade-db
diff --git a/api/init_data/plugins/packages/langgenius-agent_0.0.11.difypkg b/api/init_data/plugins/packages/langgenius-agent_0.0.9.difypkg
similarity index 98%
rename from api/init_data/plugins/packages/langgenius-agent_0.0.11.difypkg
rename to api/init_data/plugins/packages/langgenius-agent_0.0.9.difypkg
index eb7ac5f66e..56f5d8c27a 100644
Binary files a/api/init_data/plugins/packages/langgenius-agent_0.0.11.difypkg and b/api/init_data/plugins/packages/langgenius-agent_0.0.9.difypkg differ
diff --git a/api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.11.difypkg b/api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.11.difypkg
deleted file mode 100644
index 151db5c4a6..0000000000
Binary files a/api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.11.difypkg and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7 b/api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.7.difypkg
similarity index 97%
rename from api/init_data/plugins/storage/plugin/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7
rename to api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.7.difypkg
index 151db5c4a6..42b76021a1 100644
Binary files a/api/init_data/plugins/storage/plugin/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7 and b/api/init_data/plugins/packages/langgenius-openai_api_compatible_0.0.7.difypkg differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3 b/api/init_data/plugins/packages/langgenius-siliconflow_0.0.7.difypkg
similarity index 94%
rename from api/init_data/plugins/storage/plugin_packages/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3
rename to api/init_data/plugins/packages/langgenius-siliconflow_0.0.7.difypkg
index 4a5441cd85..8b11582947 100644
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3 and b/api/init_data/plugins/packages/langgenius-siliconflow_0.0.7.difypkg differ
diff --git a/api/init_data/plugins/packages/langgenius-siliconflow_0.0.8.difypkg b/api/init_data/plugins/packages/langgenius-siliconflow_0.0.8.difypkg
deleted file mode 100644
index 4a5441cd85..0000000000
Binary files a/api/init_data/plugins/packages/langgenius-siliconflow_0.0.8.difypkg and /dev/null differ
diff --git a/api/init_data/plugins/packages/langgenius-tongyi_0.0.14.difypkg b/api/init_data/plugins/packages/langgenius-tongyi_0.0.14.difypkg
deleted file mode 100644
index 8532a7140e..0000000000
Binary files a/api/init_data/plugins/packages/langgenius-tongyi_0.0.14.difypkg and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb b/api/init_data/plugins/packages/langgenius-tongyi_0.0.7.difypkg
similarity index 85%
rename from api/init_data/plugins/storage/plugin/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb
rename to api/init_data/plugins/packages/langgenius-tongyi_0.0.7.difypkg
index 8532a7140e..c025613fc9 100644
Binary files a/api/init_data/plugins/storage/plugin/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb and b/api/init_data/plugins/packages/langgenius-tongyi_0.0.7.difypkg differ
diff --git a/api/init_data/plugins/storage/assets/0458e787b7706a3743846cc695088866360b67a5a7d6020065f8c7e5ac091bc9.png b/api/init_data/plugins/storage/assets/0458e787b7706a3743846cc695088866360b67a5a7d6020065f8c7e5ac091bc9.png
deleted file mode 100644
index bd8f2762d1..0000000000
Binary files a/api/init_data/plugins/storage/assets/0458e787b7706a3743846cc695088866360b67a5a7d6020065f8c7e5ac091bc9.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/assets/0dbcd12864243bfcd8c0c1898a3e0c37ea553c21a727800b0863a599a9660729.svg b/api/init_data/plugins/storage/assets/0dbcd12864243bfcd8c0c1898a3e0c37ea553c21a727800b0863a599a9660729.svg
deleted file mode 100644
index ad6b384f7a..0000000000
--- a/api/init_data/plugins/storage/assets/0dbcd12864243bfcd8c0c1898a3e0c37ea553c21a727800b0863a599a9660729.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/assets/450d471ec223ca027aa3de206d1aafcd67cd3fcefcbdc9c28eafac21513a9e4c.png b/api/init_data/plugins/storage/assets/450d471ec223ca027aa3de206d1aafcd67cd3fcefcbdc9c28eafac21513a9e4c.png
deleted file mode 100644
index 94de01136a..0000000000
Binary files a/api/init_data/plugins/storage/assets/450d471ec223ca027aa3de206d1aafcd67cd3fcefcbdc9c28eafac21513a9e4c.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/assets/49323fc47c82d3bf400280689f9ffa17708cfe465c7e1f3bbfb24f2a42ec0e2c.svg b/api/init_data/plugins/storage/assets/49323fc47c82d3bf400280689f9ffa17708cfe465c7e1f3bbfb24f2a42ec0e2c.svg
deleted file mode 100644
index 425494404f..0000000000
--- a/api/init_data/plugins/storage/assets/49323fc47c82d3bf400280689f9ffa17708cfe465c7e1f3bbfb24f2a42ec0e2c.svg
+++ /dev/null
@@ -1,22 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/assets/69f80e7dfe36e036321767f69cad4755fe162cf581b206a8290dce0629d2e4f6.svg b/api/init_data/plugins/storage/assets/69f80e7dfe36e036321767f69cad4755fe162cf581b206a8290dce0629d2e4f6.svg
deleted file mode 100644
index aa854a7504..0000000000
--- a/api/init_data/plugins/storage/assets/69f80e7dfe36e036321767f69cad4755fe162cf581b206a8290dce0629d2e4f6.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/assets/758825b9b095f55a1e391b138694e0d3c1cb07fd5eef27d7e5915aa7e2718a97.svg b/api/init_data/plugins/storage/assets/758825b9b095f55a1e391b138694e0d3c1cb07fd5eef27d7e5915aa7e2718a97.svg
deleted file mode 100644
index 39d8a1ece6..0000000000
--- a/api/init_data/plugins/storage/assets/758825b9b095f55a1e391b138694e0d3c1cb07fd5eef27d7e5915aa7e2718a97.svg
+++ /dev/null
@@ -1,15 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/assets/7d40d629e02c01404af94652a8684f9aaab0da105182fc16fafe0da4e183dd9e.png b/api/init_data/plugins/storage/assets/7d40d629e02c01404af94652a8684f9aaab0da105182fc16fafe0da4e183dd9e.png
deleted file mode 100644
index c1aff40ee0..0000000000
Binary files a/api/init_data/plugins/storage/assets/7d40d629e02c01404af94652a8684f9aaab0da105182fc16fafe0da4e183dd9e.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/assets/87afd76dc06bfd0ef344496e0a061e195bbfbcaf604606634fac00d5d2b83caf.svg b/api/init_data/plugins/storage/assets/87afd76dc06bfd0ef344496e0a061e195bbfbcaf604606634fac00d5d2b83caf.svg
deleted file mode 100644
index 16e406f030..0000000000
--- a/api/init_data/plugins/storage/assets/87afd76dc06bfd0ef344496e0a061e195bbfbcaf604606634fac00d5d2b83caf.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/assets/bfff83a66922c09cb5a5aa68829742b8b4f4e818579db42f53c7b8a30912cd8b.svg b/api/init_data/plugins/storage/assets/bfff83a66922c09cb5a5aa68829742b8b4f4e818579db42f53c7b8a30912cd8b.svg
deleted file mode 100644
index f8482a96b9..0000000000
--- a/api/init_data/plugins/storage/assets/bfff83a66922c09cb5a5aa68829742b8b4f4e818579db42f53c7b8a30912cd8b.svg
+++ /dev/null
@@ -1,15 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/assets/e74e644589f5d78cd6019be7b92050c2b54b2645139af705fe610649a73282cf.svg b/api/init_data/plugins/storage/assets/e74e644589f5d78cd6019be7b92050c2b54b2645139af705fe610649a73282cf.svg
deleted file mode 100644
index c0d23316fe..0000000000
--- a/api/init_data/plugins/storage/assets/e74e644589f5d78cd6019be7b92050c2b54b2645139af705fe610649a73282cf.svg
+++ /dev/null
@@ -1,21 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/assets/fb1d7c05088e34ecabd0e087ebcfd929be9aad785b5e21e0577c2aa82acf7ae0.svg b/api/init_data/plugins/storage/assets/fb1d7c05088e34ecabd0e087ebcfd929be9aad785b5e21e0577c2aa82acf7ae0.svg
deleted file mode 100644
index ce65af405f..0000000000
--- a/api/init_data/plugins/storage/assets/fb1d7c05088e34ecabd0e087ebcfd929be9aad785b5e21e0577c2aa82acf7ae0.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/.env.example b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/.env.example
deleted file mode 100644
index 2fa2ad9bf6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/.env.example
+++ /dev/null
@@ -1,4 +0,0 @@
-INSTALL_METHOD=remote
-REMOTE_INSTALL_HOST=debug-plugin.dify.dev
-REMOTE_INSTALL_PORT=5003
-REMOTE_INSTALL_KEY=ae1aa1c9-0af4-43db-b6d4-4fa9e6bfb646
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/README.md b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/README.md
deleted file mode 100644
index 4e9b49148f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/README.md
+++ /dev/null
@@ -1,24 +0,0 @@
-# Overview
-The Agent node in Dify Chatflow/Workflow lets LLMs autonomously use tools. This plugin features two official Dify Agent reasoning strategies, enabling LLMs to dynamically select and run tools during runtime for multi-step problem-solving.
-
-## Strategies
-
-### 1. Function Calling
-Function Calling maps user commands to specific functions or tools. The LLM identifies the user's intent, decides which function to call, and extracts the required parameters. It is a straightforward mechanism for invoking external capabilities.
-
-
-
-#### Pros:
-- **Precise:** Directly calls the right tool for defined tasks, avoiding complex reasoning.
-- **Easy External Integration:** Integrates external APIs and tools as callable functions.
-- **Structured Output:** Provides structured function call information for easy processing.
-
-### 2. ReAct (Reason + Act)
-ReAct alternates between the LLM reasoning about the situation and taking actions. The LLM analyzes the current state and goal, selects and uses a tool, and then uses the tool's output for the next thought and action. This cycle repeats until the problem is resolved.
-
-
-
-#### Pros:
-- **Leverages External Information:** Effectively uses external tools to gather information for tasks the model cannot handle alone.
-- **Explainable Reasoning:** Interwoven reasoning and action steps allow some tracking of the Agent's process.
-- **Wide Applicability:** Suitable for tasks requiring external knowledge or specific actions, such as Q&A, information retrieval, and task execution.
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/function_calling.png b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/function_calling.png
deleted file mode 100644
index f0ce6b0c41..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/function_calling.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/icon.svg b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/icon.svg
deleted file mode 100644
index c0d23316fe..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/icon.svg
+++ /dev/null
@@ -1,21 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/react.png b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/react.png
deleted file mode 100644
index 271d6b82f7..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/_assets/react.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/main.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/main.py
deleted file mode 100644
index 08eb1bd963..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/main.py
+++ /dev/null
@@ -1,10 +0,0 @@
-import sys
-
-sys.path.append("../..")
-
-from dify_plugin import DifyPluginEnv, Plugin
-
-plugin = Plugin(DifyPluginEnv(MAX_REQUEST_TIMEOUT=240))
-
-if __name__ == "__main__":
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/manifest.yaml
deleted file mode 100644
index d330737af3..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/manifest.yaml
+++ /dev/null
@@ -1,34 +0,0 @@
-version: 0.0.11
-type: plugin
-author: "langgenius"
-name: "agent"
-label:
- en_US: "Dify Agent Strategies"
- zh_Hans: "Dify Agent 策略"
-created_at: "2024-07-12T08:03:44.658609186Z"
-icon: icon.svg
-description:
- en_US: Dify official Agent strategies collection
- zh_Hans: Dify 官方 Agent 策略集合
-tags:
- - "agent"
-resource:
- memory: 1048576
- permission:
- tool:
- enabled: true
- model:
- enabled: true
- llm: true
-plugins:
- agent_strategies:
- - "provider/agent.yaml"
-meta:
- version: 0.0.1
- arch:
- - "amd64"
- - "arm64"
- runner:
- language: "python"
- version: "3.12"
- entrypoint: "main"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/output_parser/cot_output_parser.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/output_parser/cot_output_parser.py
deleted file mode 100644
index 82e32d8039..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/output_parser/cot_output_parser.py
+++ /dev/null
@@ -1,212 +0,0 @@
-import json
-import re
-from collections.abc import Generator
-from typing import Union
-
-from dify_plugin.entities.model.llm import LLMResultChunk
-from dify_plugin.interfaces.agent import AgentScratchpadUnit
-
-
-class CotAgentOutputParser:
- @classmethod
- def handle_react_stream_output(
- cls, llm_response: Generator[LLMResultChunk, None, None], usage_dict: dict
- ) -> Generator[Union[str, AgentScratchpadUnit.Action], None, None]:
- def parse_action(json_str):
- try:
- action = json.loads(json_str, strict=False)
- action_name = None
- action_input = None
-
- # cohere always returns a list
- if isinstance(action, list) and len(action) == 1:
- action = action[0]
-
- for key, value in action.items():
- if "input" in key.lower():
- action_input = value
- else:
- action_name = value
-
- if action_name is not None and action_input is not None:
- return AgentScratchpadUnit.Action(
- action_name=action_name,
- action_input=action_input,
- )
- else:
- return json_str or ""
- except:
- return json_str or ""
-
- def extra_json_from_code_block(
- code_block,
- ) -> Generator[Union[str, AgentScratchpadUnit.Action], None, None]:
- code_blocks = re.findall(r"```(.*?)```", code_block, re.DOTALL)
- if not code_blocks:
- return
- for block in code_blocks:
- json_text = re.sub(
- r"^[a-zA-Z]+\n", "", block.strip(), flags=re.MULTILINE
- )
- yield parse_action(json_text)
-
- code_block_cache = ""
- code_block_delimiter_count = 0
- in_code_block = False
- json_cache = ""
- json_quote_count = 0
- in_json = False
- got_json = False
-
- action_cache = ""
- action_str = "action:"
- action_idx = 0
-
- thought_cache = ""
- thought_str = "thought:"
- thought_idx = 0
-
- last_character = ""
-
- for response in llm_response:
- if response.delta.usage:
- usage_dict["usage"] = response.delta.usage
- response_content = response.delta.message.content
- if not isinstance(response_content, str):
- continue
-
- # stream
- index = 0
- while index < len(response_content):
- steps = 1
- delta = response_content[index : index + steps]
- yield_delta = False
-
- if delta == "`":
- last_character = delta
- code_block_cache += delta
- code_block_delimiter_count += 1
- else:
- if not in_code_block:
- if code_block_delimiter_count > 0:
- last_character = delta
- yield code_block_cache
- code_block_cache = ""
- else:
- last_character = delta
- code_block_cache += delta
- code_block_delimiter_count = 0
-
- if not in_code_block and not in_json:
- if delta.lower() == action_str[action_idx] and action_idx == 0:
- if last_character not in {"\n", " ", ""}:
- yield_delta = True
- else:
- last_character = delta
- action_cache += delta
- action_idx += 1
- if action_idx == len(action_str):
- action_cache = ""
- action_idx = 0
- index += steps
- continue
- elif delta.lower() == action_str[action_idx] and action_idx > 0:
- last_character = delta
- action_cache += delta
- action_idx += 1
- if action_idx == len(action_str):
- action_cache = ""
- action_idx = 0
- index += steps
- continue
- else:
- if action_cache:
- last_character = delta
- yield action_cache
- action_cache = ""
- action_idx = 0
-
- if delta.lower() == thought_str[thought_idx] and thought_idx == 0:
- if last_character not in {"\n", " ", ""}:
- yield_delta = True
- else:
- last_character = delta
- thought_cache += delta
- thought_idx += 1
- if thought_idx == len(thought_str):
- thought_cache = ""
- thought_idx = 0
- index += steps
- continue
- elif delta.lower() == thought_str[thought_idx] and thought_idx > 0:
- last_character = delta
- thought_cache += delta
- thought_idx += 1
- if thought_idx == len(thought_str):
- thought_cache = ""
- thought_idx = 0
- index += steps
- continue
- else:
- if thought_cache:
- last_character = delta
- yield thought_cache
- thought_cache = ""
- thought_idx = 0
-
- if yield_delta:
- index += steps
- last_character = delta
- yield delta
- continue
-
- if code_block_delimiter_count == 3:
- if in_code_block:
- last_character = delta
- yield from extra_json_from_code_block(code_block_cache)
- code_block_cache = ""
-
- in_code_block = not in_code_block
- code_block_delimiter_count = 0
-
- if not in_code_block:
- # handle single json
- if delta == "{":
- json_quote_count += 1
- in_json = True
- last_character = delta
- json_cache += delta
- elif delta == "}":
- last_character = delta
- json_cache += delta
- if json_quote_count > 0:
- json_quote_count -= 1
- if json_quote_count == 0:
- in_json = False
- got_json = True
- index += steps
- continue
- else:
- if in_json:
- last_character = delta
- json_cache += delta
-
- if got_json:
- got_json = False
- last_character = delta
- yield parse_action(json_cache)
- json_cache = ""
- json_quote_count = 0
- in_json = False
-
- if not in_code_block and not in_json:
- last_character = delta
- yield delta.replace("`", "")
-
- index += steps
-
- if code_block_cache:
- yield code_block_cache
-
- if json_cache:
- yield parse_action(json_cache)
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/prompt/template.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/prompt/template.py
deleted file mode 100644
index ef64fd29fc..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/prompt/template.py
+++ /dev/null
@@ -1,106 +0,0 @@
-ENGLISH_REACT_COMPLETION_PROMPT_TEMPLATES = """Respond to the human as helpfully and accurately as possible.
-
-{{instruction}}
-
-You have access to the following tools:
-
-{{tools}}
-
-Use a json blob to specify a tool by providing an action key (tool name) and an action_input key (tool input).
-Valid "action" values: "Final Answer" or {{tool_names}}
-
-Provide only ONE action per $JSON_BLOB, as shown:
-
-```
-{
- "action": $TOOL_NAME,
- "action_input": $ACTION_INPUT
-}
-```
-
-Follow this format:
-
-Question: input question to answer
-Thought: consider previous and subsequent steps
-Action:
-```
-$JSON_BLOB
-```
-Observation: action result
-... (repeat Thought/Action/Observation N times)
-Thought: I know what to respond
-Action:
-```
-{
- "action": "Final Answer",
- "action_input": "Final response to human"
-}
-```
-
-Begin! Reminder to ALWAYS respond with a valid json blob of a single action. Use tools if necessary. Respond directly if appropriate. Format is Action:```$JSON_BLOB```then Observation:.
-{{historic_messages}}
-Question: {{query}}
-{{agent_scratchpad}}
-Thought:""" # noqa: E501
-
-
-ENGLISH_REACT_COMPLETION_AGENT_SCRATCHPAD_TEMPLATES = """Observation: {{observation}}
-Thought:"""
-
-ENGLISH_REACT_CHAT_PROMPT_TEMPLATES = """Respond to the human as helpfully and accurately as possible.
-
-{{instruction}}
-
-You have access to the following tools:
-
-{{tools}}
-
-Use a json blob to specify a tool by providing an action key (tool name) and an action_input key (tool input).
-Valid "action" values: "Final Answer" or {{tool_names}}
-
-Provide only ONE action per $JSON_BLOB, as shown:
-
-```
-{
- "action": $TOOL_NAME,
- "action_input": $ACTION_INPUT
-}
-```
-
-Follow this format:
-
-Question: input question to answer
-Thought: consider previous and subsequent steps
-Action:
-```
-$JSON_BLOB
-```
-Observation: action result
-... (repeat Thought/Action/Observation N times)
-Thought: I know what to respond
-Action:
-```
-{
- "action": "Final Answer",
- "action_input": "Final response to human"
-}
-```
-
-Begin! Reminder to ALWAYS respond with a valid json blob of a single action. Use tools if necessary. Respond directly if appropriate. Format is Action:```$JSON_BLOB```then Observation:.
-""" # noqa: E501
-
-
-ENGLISH_REACT_CHAT_AGENT_SCRATCHPAD_TEMPLATES = ""
-
-REACT_PROMPT_TEMPLATES = {
- "english": {
- "chat": {
- "prompt": ENGLISH_REACT_CHAT_PROMPT_TEMPLATES,
- "agent_scratchpad": ENGLISH_REACT_CHAT_AGENT_SCRATCHPAD_TEMPLATES,
- },
- "completion": {
- "prompt": ENGLISH_REACT_COMPLETION_PROMPT_TEMPLATES,
- "agent_scratchpad": ENGLISH_REACT_COMPLETION_AGENT_SCRATCHPAD_TEMPLATES,
- },
- }
-}
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.py
deleted file mode 100644
index a3394298b6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.py
+++ /dev/null
@@ -1,5 +0,0 @@
-from dify_plugin.interfaces.agent import AgentProvider
-
-
-class LanggeniusAgentProvider(AgentProvider):
- pass
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.yaml b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.yaml
deleted file mode 100644
index 7be6dbbbce..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/provider/agent.yaml
+++ /dev/null
@@ -1,18 +0,0 @@
-identity:
- author: langgenius
- name: agent
- label:
- en_US: Agent
- zh_Hans: Agent
- pt_BR: Agent
- description:
- en_US: Agent
- zh_Hans: Agent
- pt_BR: Agent
- icon: icon.svg
-strategies:
- - strategies/function_calling.yaml
- - strategies/ReAct.yaml
-extra:
- python:
- source: provider/agent.py
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/requirements.txt
deleted file mode 100644
index d9ba35abcf..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/requirements.txt
+++ /dev/null
@@ -1 +0,0 @@
-dify_plugin==0.0.1b74
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.py
deleted file mode 100644
index f1a2b5feb9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.py
+++ /dev/null
@@ -1,642 +0,0 @@
-import json
-import time
-from collections.abc import Generator, Mapping
-from typing import Any, Optional, cast
-
-from dify_plugin.entities.agent import AgentInvokeMessage
-from dify_plugin.entities.model.llm import LLMModelConfig, LLMUsage
-from dify_plugin.entities.model.message import (
- AssistantPromptMessage,
- PromptMessage,
- SystemPromptMessage,
- ToolPromptMessage,
- UserPromptMessage,
-)
-from dify_plugin.entities.tool import (
- LogMetadata,
- ToolInvokeMessage,
- ToolParameter,
- ToolProviderType,
-)
-from dify_plugin.interfaces.agent import (
- AgentModelConfig,
- AgentScratchpadUnit,
- AgentStrategy,
- ToolEntity,
-)
-from output_parser.cot_output_parser import CotAgentOutputParser
-from prompt.template import REACT_PROMPT_TEMPLATES
-from pydantic import BaseModel, Field
-
-ignore_observation_providers = ["wenxin"]
-
-
-class ReActParams(BaseModel):
- query: str
- instruction: str | None
- model: AgentModelConfig
- tools: list[ToolEntity] | None
- inputs: dict[str, Any] = {}
- maximum_iterations: int = 3
-
-
-class AgentPromptEntity(BaseModel):
- """
- Agent Prompt Entity.
- """
-
- first_prompt: str
- next_iteration: str
-
-
-class ToolInvokeMeta(BaseModel):
- """
- Tool invoke meta
- """
-
- time_cost: float = Field(..., description="The time cost of the tool invoke")
- error: Optional[str] = None
- tool_config: Optional[dict] = None
-
- @classmethod
- def empty(cls) -> "ToolInvokeMeta":
- """
- Get an empty instance of ToolInvokeMeta
- """
- return cls(time_cost=0.0, error=None, tool_config={})
-
- @classmethod
- def error_instance(cls, error: str) -> "ToolInvokeMeta":
- """
- Get an instance of ToolInvokeMeta with error
- """
- return cls(time_cost=0.0, error=error, tool_config={})
-
- def to_dict(self) -> dict:
- return {
- "time_cost": self.time_cost,
- "error": self.error,
- "tool_config": self.tool_config,
- }
-
-
-class ReActAgentStrategy(AgentStrategy):
- def _invoke(self, parameters: dict[str, Any]) -> Generator[AgentInvokeMessage]:
- react_params = ReActParams(**parameters)
- query = react_params.query
- model = react_params.model
- agent_scratchpad = []
- history_prompt_messages: list[PromptMessage] = []
- current_session_messages = []
- self._organize_historic_prompt_messages(
- history_prompt_messages, current_session_messages=current_session_messages
- )
- tools = react_params.tools
- tool_instances = {tool.identity.name: tool for tool in tools} if tools else {}
- react_params.model.completion_params = (
- react_params.model.completion_params or {}
- )
- # check model mode
- stop = (
- react_params.model.completion_params.get("stop", [])
- if react_params.model.completion_params
- else []
- )
-
- if (
- "Observation" not in stop
- and model.provider not in ignore_observation_providers
- ):
- stop.append("Observation")
- # init instruction
- inputs = react_params.inputs
- instruction = react_params.instruction or ""
- self._instruction = self._fill_in_inputs_from_external_data_tools(
- instruction, inputs
- )
-
- iteration_step = 1
- max_iteration_steps = react_params.maximum_iterations
-
- # convert tools into ModelRuntime Tool format
- prompt_messages_tools = self._init_prompt_tools(tools)
- self._prompt_messages_tools = prompt_messages_tools
-
- run_agent_state = True
- llm_usage: dict[str, Optional[LLMUsage]] = {"usage": None}
- final_answer = ""
- prompt_messages = []
- while run_agent_state and iteration_step <= max_iteration_steps:
- # continue to run until there is not any tool call
- run_agent_state = False
- round_started_at = time.perf_counter()
- round_log = self.create_log_message(
- label=f"ROUND {iteration_step}",
- data={},
- metadata={
- LogMetadata.STARTED_AT: round_started_at,
- },
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield round_log
- if iteration_step == max_iteration_steps:
- # the last iteration, remove all tools
- self._prompt_messages_tools = []
-
- message_file_ids: list[str] = []
-
- # recalc llm max tokens
- prompt_messages = self._organize_prompt_messages(agent_scratchpad, query)
- if model.completion_params:
- self.recalc_llm_max_tokens(
- model.entity, prompt_messages, model.completion_params
- )
- # invoke model
- chunks = self.session.model.llm.invoke(
- model_config=LLMModelConfig(**model.model_dump(mode="json")),
- prompt_messages=prompt_messages,
- stream=True,
- stop=stop,
- )
-
- usage_dict = {}
- react_chunks = CotAgentOutputParser.handle_react_stream_output(
- chunks, usage_dict
- )
- scratchpad = AgentScratchpadUnit(
- agent_response="",
- thought="",
- action_str="",
- observation="",
- action=None,
- )
-
- model_started_at = time.perf_counter()
- model_log = self.create_log_message(
- label=f"{model.model} Thought",
- data={},
- metadata={
- LogMetadata.STARTED_AT: model_started_at,
- LogMetadata.PROVIDER: model.provider,
- },
- parent=round_log,
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield model_log
-
- for chunk in react_chunks:
- if isinstance(chunk, AgentScratchpadUnit.Action):
- action = chunk
- # detect action
- assert scratchpad.agent_response is not None
- scratchpad.agent_response += json.dumps(chunk.model_dump())
-
- scratchpad.action_str = json.dumps(chunk.model_dump())
- scratchpad.action = action
- else:
- scratchpad.agent_response = scratchpad.agent_response or ""
- scratchpad.thought = scratchpad.thought or ""
- scratchpad.agent_response += chunk
- scratchpad.thought += chunk
- scratchpad.thought = (
- scratchpad.thought.strip()
- if scratchpad.thought
- else "I am thinking about how to help you"
- )
- agent_scratchpad.append(scratchpad)
-
- # get llm usage
- if "usage" in usage_dict:
- if usage_dict["usage"] is not None:
- self.increase_usage(llm_usage, usage_dict["usage"])
- else:
- usage_dict["usage"] = LLMUsage.empty_usage()
-
- action = (
- scratchpad.action.to_dict()
- if scratchpad.action
- else {"action": scratchpad.agent_response}
- )
-
- yield self.finish_log_message(
- log=model_log,
- data={"thought": scratchpad.thought, **action},
- metadata={
- LogMetadata.STARTED_AT: model_started_at,
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter() - model_started_at,
- LogMetadata.PROVIDER: model.provider,
- LogMetadata.TOTAL_PRICE: usage_dict["usage"].total_price
- if usage_dict["usage"]
- else 0,
- LogMetadata.CURRENCY: usage_dict["usage"].currency
- if usage_dict["usage"]
- else "",
- LogMetadata.TOTAL_TOKENS: usage_dict["usage"].total_tokens
- if usage_dict["usage"]
- else 0,
- },
- )
- if not scratchpad.action:
- final_answer = scratchpad.thought
- else:
- if scratchpad.action.action_name.lower() == "final answer":
- # action is final answer, return final answer directly
- try:
- if isinstance(scratchpad.action.action_input, dict):
- final_answer = json.dumps(scratchpad.action.action_input)
- elif isinstance(scratchpad.action.action_input, str):
- final_answer = scratchpad.action.action_input
- else:
- final_answer = f"{scratchpad.action.action_input}"
- except json.JSONDecodeError:
- final_answer = f"{scratchpad.action.action_input}"
- else:
- run_agent_state = True
- # action is tool call, invoke tool
- tool_call_started_at = time.perf_counter()
- tool_name = scratchpad.action.action_name
- tool_call_log = self.create_log_message(
- label=f"CALL {tool_name}",
- data={},
- metadata={
- LogMetadata.STARTED_AT: time.perf_counter(),
- LogMetadata.PROVIDER: tool_instances[
- tool_name
- ].identity.provider
- if tool_instances.get(tool_name)
- else "",
- },
- parent=round_log,
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield tool_call_log
- tool_invoke_response, tool_invoke_parameters = (
- self._handle_invoke_action(
- action=scratchpad.action,
- tool_instances=tool_instances,
- message_file_ids=message_file_ids,
- )
- )
- scratchpad.observation = tool_invoke_response
- scratchpad.agent_response = tool_invoke_response
- yield self.finish_log_message(
- log=tool_call_log,
- data={
- "tool_name": tool_name,
- "tool_call_args": tool_invoke_parameters,
- "output": tool_invoke_response,
- },
- metadata={
- LogMetadata.STARTED_AT: tool_call_started_at,
- LogMetadata.PROVIDER: tool_instances[
- tool_name
- ].identity.provider
- if tool_instances.get(tool_name)
- else "",
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter()
- - tool_call_started_at,
- },
- )
-
- # update prompt tool message
- for prompt_tool in self._prompt_messages_tools:
- self.update_prompt_message_tool(
- tool_instances[prompt_tool.name], prompt_tool
- )
- yield self.finish_log_message(
- log=round_log,
- data={
- "action_name": scratchpad.action.action_name
- if scratchpad.action
- else "",
- "action_input": scratchpad.action.action_input
- if scratchpad.action
- else "",
- "thought": scratchpad.thought,
- "observation": scratchpad.observation,
- },
- metadata={
- LogMetadata.STARTED_AT: round_started_at,
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter() - round_started_at,
- LogMetadata.TOTAL_PRICE: usage_dict["usage"].total_price
- if usage_dict["usage"]
- else 0,
- LogMetadata.CURRENCY: usage_dict["usage"].currency
- if usage_dict["usage"]
- else "",
- LogMetadata.TOTAL_TOKENS: usage_dict["usage"].total_tokens
- if usage_dict["usage"]
- else 0,
- },
- )
- iteration_step += 1
-
- yield self.create_text_message(final_answer)
- yield self.create_json_message(
- {
- "execution_metadata": {
- LogMetadata.TOTAL_PRICE: llm_usage["usage"].total_price
- if llm_usage["usage"] is not None
- else 0,
- LogMetadata.CURRENCY: llm_usage["usage"].currency
- if llm_usage["usage"] is not None
- else "",
- LogMetadata.TOTAL_TOKENS: llm_usage["usage"].total_tokens
- if llm_usage["usage"] is not None
- else 0,
- }
- }
- )
-
- def _organize_system_prompt(self) -> SystemPromptMessage:
- """
- Organize system prompt
- """
-
- prompt_entity = AgentPromptEntity(
- first_prompt=REACT_PROMPT_TEMPLATES["english"]["chat"]["prompt"],
- next_iteration=REACT_PROMPT_TEMPLATES["english"]["chat"][
- "agent_scratchpad"
- ],
- )
- if not prompt_entity:
- raise ValueError("Agent prompt configuration is not set")
- first_prompt = prompt_entity.first_prompt
-
- system_prompt = (
- first_prompt.replace("{{instruction}}", self._instruction)
- .replace(
- "{{tools}}",
- json.dumps(
- [
- tool.model_dump(mode="json")
- for tool in self._prompt_messages_tools
- ]
- ),
- )
- .replace(
- "{{tool_names}}",
- ", ".join([tool.name for tool in self._prompt_messages_tools]),
- )
- )
-
- return SystemPromptMessage(content=system_prompt)
-
- def _organize_user_query(
- self, query, prompt_messages: list[PromptMessage]
- ) -> list[PromptMessage]:
- """
- Organize user query
- """
- prompt_messages.append(UserPromptMessage(content=query))
-
- return prompt_messages
-
- def _organize_prompt_messages(
- self, agent_scratchpad: list, query: str
- ) -> list[PromptMessage]:
- """
- Organize
- """
- # organize system prompt
- system_message = self._organize_system_prompt()
-
- # organize current assistant messages
- agent_scratchpad = agent_scratchpad
- if not agent_scratchpad:
- assistant_messages = []
- else:
- assistant_message = AssistantPromptMessage(content="")
- assistant_message.content = (
- "" # FIXME: type check tell mypy that assistant_message.content is str
- )
- for unit in agent_scratchpad:
- if unit.is_final():
- assert isinstance(assistant_message.content, str)
- assistant_message.content += f"Final Answer: {unit.agent_response}"
- else:
- assert isinstance(assistant_message.content, str)
- assistant_message.content += f"Thought: {unit.thought}\n\n"
- if unit.action_str:
- assistant_message.content += f"Action: {unit.action_str}\n\n"
- if unit.observation:
- assistant_message.content += (
- f"Observation: {unit.observation}\n\n"
- )
-
- assistant_messages = [assistant_message]
-
- # query messages
- query_messages = self._organize_user_query(query, [])
-
- if assistant_messages:
- # organize historic prompt messages
- historic_messages = self._organize_historic_prompt_messages(
- [
- system_message,
- *query_messages,
- *assistant_messages,
- UserPromptMessage(content="continue"),
- ]
- )
- messages = [
- system_message,
- *historic_messages,
- *query_messages,
- *assistant_messages,
- UserPromptMessage(content="continue"),
- ]
- else:
- # organize historic prompt messages
- historic_messages = self._organize_historic_prompt_messages(
- [system_message, *query_messages]
- )
- messages = [system_message, *historic_messages, *query_messages]
-
- # join all messages
- return messages
-
- def _handle_invoke_action(
- self,
- action: AgentScratchpadUnit.Action,
- tool_instances: Mapping[str, ToolEntity],
- message_file_ids: list[str],
- ) -> tuple[str, dict[str, Any] | str]:
- """
- handle invoke action
- :param action: action
- :param tool_instances: tool instances
- :param message_file_ids: message file ids
- :param trace_manager: trace manager
- :return: observation, meta
- """
- # action is tool call, invoke tool
- tool_call_name = action.action_name
- tool_call_args = action.action_input
- tool_instance = tool_instances.get(tool_call_name)
-
- if not tool_instance:
- answer = f"there is not a tool named {tool_call_name}"
- return answer, tool_call_args
-
- if isinstance(tool_call_args, str):
- try:
- tool_call_args = json.loads(tool_call_args)
- except json.JSONDecodeError as e:
- params = [
- param.name
- for param in tool_instance.parameters
- if param.form == ToolParameter.ToolParameterForm.LLM
- ]
- if len(params) > 1:
- raise ValueError("tool call args is not a valid json string") from e
- tool_call_args = {params[0]: tool_call_args} if len(params) == 1 else {}
-
- tool_invoke_parameters = {**tool_instance.runtime_parameters, **tool_call_args}
- try:
- tool_invoke_responses = self.session.tool.invoke(
- provider_type=ToolProviderType(tool_instance.provider_type),
- provider=tool_instance.identity.provider,
- tool_name=tool_instance.identity.name,
- parameters=tool_invoke_parameters,
- )
- result = ""
- for response in tool_invoke_responses:
- if response.type == ToolInvokeMessage.MessageType.TEXT:
- result += cast(ToolInvokeMessage.TextMessage, response.message).text
- elif response.type == ToolInvokeMessage.MessageType.LINK:
- result += (
- f"result link: {cast(ToolInvokeMessage.TextMessage, response.message).text}."
- + " please tell user to check it."
- )
- elif response.type in {
- ToolInvokeMessage.MessageType.IMAGE_LINK,
- ToolInvokeMessage.MessageType.IMAGE,
- }:
- result += (
- "image has been created and sent to user already, "
- + "you do not need to create it, just tell the user to check it now."
- )
- elif response.type == ToolInvokeMessage.MessageType.JSON:
- text = json.dumps(
- cast(
- ToolInvokeMessage.JsonMessage, response.message
- ).json_object,
- ensure_ascii=False,
- )
- result += f"tool response: {text}."
- else:
- result += f"tool response: {response.message!r}."
- except Exception as e:
- result = f"tool invoke error: {str(e)}"
-
- return result, tool_invoke_parameters
-
- def _convert_dict_to_action(self, action: dict) -> AgentScratchpadUnit.Action:
- """
- convert dict to action
- """
- return AgentScratchpadUnit.Action(
- action_name=action["action"], action_input=action["action_input"]
- )
-
- def _fill_in_inputs_from_external_data_tools(
- self, instruction: str, inputs: Mapping[str, Any]
- ) -> str:
- """
- fill in inputs from external data tools
- """
- for key, value in inputs.items():
- try:
- instruction = instruction.replace(f"{{{{{key}}}}}", str(value))
- except Exception:
- continue
-
- return instruction
-
- def _format_assistant_message(
- self, agent_scratchpad: list[AgentScratchpadUnit]
- ) -> str:
- """
- format assistant message
- """
- message = ""
- for scratchpad in agent_scratchpad:
- if scratchpad.is_final():
- message += f"Final Answer: {scratchpad.agent_response}"
- else:
- message += f"Thought: {scratchpad.thought}\n\n"
- if scratchpad.action_str:
- message += f"Action: {scratchpad.action_str}\n\n"
- if scratchpad.observation:
- message += f"Observation: {scratchpad.observation}\n\n"
-
- return message
-
- def _organize_historic_prompt_messages(
- self,
- history_prompt_messages: list[PromptMessage],
- current_session_messages: list[PromptMessage] | None = None,
- ) -> list[PromptMessage]:
- """
- organize historic prompt messages
- """
- result: list[PromptMessage] = []
- scratchpads: list[AgentScratchpadUnit] = []
- current_scratchpad: AgentScratchpadUnit | None = None
-
- for message in history_prompt_messages:
- if isinstance(message, AssistantPromptMessage):
- if not current_scratchpad:
- assert isinstance(message.content, str)
- current_scratchpad = AgentScratchpadUnit(
- agent_response=message.content,
- thought=message.content
- or "I am thinking about how to help you",
- action_str="",
- action=None,
- observation=None,
- )
- scratchpads.append(current_scratchpad)
- if message.tool_calls:
- try:
- current_scratchpad.action = AgentScratchpadUnit.Action(
- action_name=message.tool_calls[0].function.name,
- action_input=json.loads(
- message.tool_calls[0].function.arguments
- ),
- )
- current_scratchpad.action_str = json.dumps(
- current_scratchpad.action.to_dict()
- )
- except Exception:
- pass
- elif isinstance(message, ToolPromptMessage):
- if current_scratchpad:
- assert isinstance(message.content, str)
- current_scratchpad.observation = message.content
- else:
- raise NotImplementedError("expected str type")
- elif isinstance(message, UserPromptMessage):
- if scratchpads:
- result.append(
- AssistantPromptMessage(
- content=self._format_assistant_message(scratchpads)
- )
- )
- scratchpads = []
- current_scratchpad = None
-
- result.append(message)
-
- if scratchpads:
- result.append(
- AssistantPromptMessage(
- content=self._format_assistant_message(scratchpads)
- )
- )
-
- return current_session_messages or []
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.yaml b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.yaml
deleted file mode 100644
index a6faffd7a6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/ReAct.yaml
+++ /dev/null
@@ -1,58 +0,0 @@
-identity:
- name: ReAct
- author: Dify
- label:
- en_US: ReAct
- zh_Hans: ReAct
- pt_BR: ReAct
-description:
- en_US: ReAct is a basic strategy for agent, model will use the tools provided to perform the task.
- zh_Hans: ReAct 是一个基本的 Agent 策略,模型将使用提供的工具来执行任务。
- pt_BR: ReAct is a basic strategy for agent, model will use the tools provided to perform the task.
-parameters:
- - name: model
- type: model-selector
- scope: tool-call&llm
- required: true
- label:
- en_US: Model
- zh_Hans: 模型
- pt_BR: Model
- - name: tools
- type: array[tools]
- required: true
- label:
- en_US: Tool list
- zh_Hans: 工具列表
- pt_BR: Tool list
- - name: instruction
- type: string
- required: true
- label:
- en_US: Instruction
- zh_Hans: 指令
- pt_BR: Instruction
- auto_generate:
- type: prompt_instruction
- template:
- enabled: true
- - name: query
- type: string
- required: true
- label:
- en_US: Query
- zh_Hans: 查询
- pt_BR: Query
- - name: maximum_iterations
- type: number
- required: true
- label:
- en_US: Maximum Iterations
- zh_Hans: 最大迭代次数
- pt_BR: Maximum Iterations
- default: 3
- min: 1
- max: 30
-extra:
- python:
- source: strategies/ReAct.py
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.py b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.py
deleted file mode 100644
index 484dedaaad..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.py
+++ /dev/null
@@ -1,546 +0,0 @@
-import json
-import time
-from collections.abc import Generator
-from copy import deepcopy
-from typing import Any, Optional, cast
-
-from dify_plugin.entities.agent import AgentInvokeMessage
-from dify_plugin.entities.model.llm import (
- LLMModelConfig,
- LLMResult,
- LLMResultChunk,
- LLMUsage,
-)
-from dify_plugin.entities.model.message import (
- AssistantPromptMessage,
- PromptMessage,
- PromptMessageContentType,
- PromptMessageRole,
- SystemPromptMessage,
- ToolPromptMessage,
- UserPromptMessage,
-)
-from dify_plugin.entities.tool import LogMetadata, ToolInvokeMessage, ToolProviderType
-from dify_plugin.interfaces.agent import AgentModelConfig, AgentStrategy, ToolEntity
-from pydantic import BaseModel, Field
-
-
-class FunctionCallingParams(BaseModel):
- query: str
- instruction: str | None
- model: AgentModelConfig
- tools: list[ToolEntity] | None
- maximum_iterations: int = 3
-
-
-class ToolInvokeMeta(BaseModel):
- """
- Tool invoke meta
- """
-
- time_cost: float = Field(..., description="The time cost of the tool invoke")
- error: Optional[str] = None
- tool_config: Optional[dict] = None
-
- @classmethod
- def empty(cls) -> "ToolInvokeMeta":
- """
- Get an empty instance of ToolInvokeMeta
- """
- return cls(time_cost=0.0, error=None, tool_config={})
-
- @classmethod
- def error_instance(cls, error: str) -> "ToolInvokeMeta":
- """
- Get an instance of ToolInvokeMeta with error
- """
- return cls(time_cost=0.0, error=error, tool_config={})
-
- def to_dict(self) -> dict:
- return {
- "time_cost": self.time_cost,
- "error": self.error,
- "tool_config": self.tool_config,
- }
-
-
-class FunctionCallingAgentStrategy(AgentStrategy):
- def __init__(self, session):
- super().__init__(session)
- self.query = ""
-
- def _invoke(self, parameters: dict[str, Any]) -> Generator[AgentInvokeMessage]:
- """
- Run FunctionCall agent application
- """
- fc_params = FunctionCallingParams(**parameters)
- query = fc_params.query
- self.query = query
- instruction = fc_params.instruction
- init_prompt_messages = [
- PromptMessage(role=PromptMessageRole.SYSTEM, content=instruction)
- ]
- tools = fc_params.tools
- tool_instances = {tool.identity.name: tool for tool in tools} if tools else {}
- model = fc_params.model
- stop = (
- fc_params.model.completion_params.get("stop", [])
- if fc_params.model.completion_params
- else []
- )
- # convert tools into ModelRuntime Tool format
- prompt_messages_tools = self._init_prompt_tools(tools)
-
- iteration_step = 1
- max_iteration_steps = fc_params.maximum_iterations
- current_thoughts: list[PromptMessage] = []
- # continue to run until there is not any tool call
- function_call_state = True
- llm_usage: dict[str, Optional[LLMUsage]] = {"usage": None}
- final_answer = ""
-
- while function_call_state and iteration_step <= max_iteration_steps:
- function_call_state = False
- round_started_at = time.perf_counter()
- round_log = self.create_log_message(
- label=f"ROUND {iteration_step}",
- data={},
- metadata={
- LogMetadata.STARTED_AT: round_started_at,
- },
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield round_log
- if iteration_step == max_iteration_steps:
- # the last iteration, remove all tools
- prompt_messages_tools = []
-
- # recalc llm max tokens
- prompt_messages = self._organize_prompt_messages(
- history_prompt_messages=init_prompt_messages,
- current_thoughts=current_thoughts,
- )
- if model.completion_params:
- self.recalc_llm_max_tokens(
- model.entity, prompt_messages, model.completion_params
- )
- # invoke model
- model_started_at = time.perf_counter()
- model_log = self.create_log_message(
- label=f"{model.model} Thought",
- data={},
- metadata={
- LogMetadata.STARTED_AT: model_started_at,
- LogMetadata.PROVIDER: model.provider,
- },
- parent=round_log,
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield model_log
- chunks: Generator[LLMResultChunk, None, None] | LLMResult = (
- self.session.model.llm.invoke(
- model_config=LLMModelConfig(**model.model_dump(mode="json")),
- prompt_messages=prompt_messages,
- stream=True,
- stop=stop,
- tools=prompt_messages_tools,
- )
- )
-
- tool_calls: list[tuple[str, str, dict[str, Any]]] = []
-
- # save full response
- response = ""
-
- # save tool call names and inputs
- tool_call_names = ""
-
- current_llm_usage = None
-
- if isinstance(chunks, Generator):
- for chunk in chunks:
- # check if there is any tool call
- if self.check_tool_calls(chunk):
- function_call_state = True
- tool_calls.extend(self.extract_tool_calls(chunk) or [])
- tool_call_names = ";".join(
- [tool_call[1] for tool_call in tool_calls]
- )
-
- if chunk.delta.message and chunk.delta.message.content:
- if isinstance(chunk.delta.message.content, list):
- for content in chunk.delta.message.content:
- response += content.data
- if (
- not function_call_state
- or iteration_step == max_iteration_steps
- ):
- yield self.create_text_message(content.data)
- else:
- response += str(chunk.delta.message.content)
- if (
- not function_call_state
- or iteration_step == max_iteration_steps
- ):
- yield self.create_text_message(
- str(chunk.delta.message.content)
- )
-
- if chunk.delta.usage:
- self.increase_usage(llm_usage, chunk.delta.usage)
- current_llm_usage = chunk.delta.usage
-
- else:
- result = chunks
- # check if there is any tool call
- if self.check_blocking_tool_calls(result):
- function_call_state = True
- tool_calls.extend(self.extract_blocking_tool_calls(result) or [])
- tool_call_names = ";".join(
- [tool_call[1] for tool_call in tool_calls]
- )
-
- if result.usage:
- self.increase_usage(llm_usage, result.usage)
- current_llm_usage = result.usage
-
- if result.message and result.message.content:
- if isinstance(result.message.content, list):
- for content in result.message.content:
- response += content.data
- else:
- response += str(result.message.content)
-
- if not result.message.content:
- result.message.content = ""
- yield self.finish_log_message(
- log=model_log,
- data={
- "output": response,
- "tool_name": tool_call_names,
- "tool_input": {
- tool_call[1]: tool_call[2] for tool_call in tool_calls
- },
- },
- metadata={
- LogMetadata.STARTED_AT: model_started_at,
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter() - model_started_at,
- LogMetadata.PROVIDER: model.provider,
- LogMetadata.TOTAL_PRICE: current_llm_usage.total_price
- if current_llm_usage
- else 0,
- LogMetadata.CURRENCY: current_llm_usage.currency
- if current_llm_usage
- else "",
- LogMetadata.TOTAL_TOKENS: current_llm_usage.total_tokens
- if current_llm_usage
- else 0,
- },
- )
- assistant_message = AssistantPromptMessage(content="", tool_calls=[])
- if tool_calls:
- assistant_message.tool_calls = [
- AssistantPromptMessage.ToolCall(
- id=tool_call[0],
- type="function",
- function=AssistantPromptMessage.ToolCall.ToolCallFunction(
- name=tool_call[1],
- arguments=json.dumps(tool_call[2], ensure_ascii=False),
- ),
- )
- for tool_call in tool_calls
- ]
- else:
- assistant_message.content = response
-
- current_thoughts.append(assistant_message)
-
- final_answer += response + "\n"
-
- # call tools
- tool_responses = []
- for tool_call_id, tool_call_name, tool_call_args in tool_calls:
- tool_instance = tool_instances[tool_call_name]
- tool_call_started_at = time.perf_counter()
- tool_call_log = self.create_log_message(
- label=f"CALL {tool_call_name}",
- data={},
- metadata={
- LogMetadata.STARTED_AT: time.perf_counter(),
- LogMetadata.PROVIDER: tool_instance.identity.provider,
- },
- parent=round_log,
- status=ToolInvokeMessage.LogMessage.LogStatus.START,
- )
- yield tool_call_log
- if not tool_instance:
- tool_response = {
- "tool_call_id": tool_call_id,
- "tool_call_name": tool_call_name,
- "tool_response": f"there is not a tool named {tool_call_name}",
- "meta": ToolInvokeMeta.error_instance(
- f"there is not a tool named {tool_call_name}"
- ).to_dict(),
- }
- else:
- # invoke tool
- try:
- tool_invoke_responses = self.session.tool.invoke(
- provider_type=ToolProviderType(tool_instance.provider_type),
- provider=tool_instance.identity.provider,
- tool_name=tool_instance.identity.name,
- parameters={
- **tool_instance.runtime_parameters,
- **tool_call_args,
- },
- )
- result = ""
- for response in tool_invoke_responses:
- if response.type == ToolInvokeMessage.MessageType.TEXT:
- result += cast(
- ToolInvokeMessage.TextMessage, response.message
- ).text
- elif response.type == ToolInvokeMessage.MessageType.LINK:
- result += (
- f"result link: {cast(ToolInvokeMessage.TextMessage, response.message).text}."
- + " please tell user to check it."
- )
- elif response.type in {
- ToolInvokeMessage.MessageType.IMAGE_LINK,
- ToolInvokeMessage.MessageType.IMAGE,
- }:
- result += (
- "image has been created and sent to user already, "
- + "you do not need to create it, just tell the user to check it now."
- )
- elif response.type == ToolInvokeMessage.MessageType.JSON:
- text = json.dumps(
- cast(
- ToolInvokeMessage.JsonMessage, response.message
- ).json_object,
- ensure_ascii=False,
- )
- result += f"tool response: {text}."
- else:
- result += f"tool response: {response.message!r}."
- except Exception as e:
- result = f"tool invoke error: {str(e)}"
- tool_response = {
- "tool_call_id": tool_call_id,
- "tool_call_name": tool_call_name,
- "tool_call_input": {
- **tool_instance.runtime_parameters,
- **tool_call_args,
- },
- "tool_response": result,
- }
-
- yield self.finish_log_message(
- log=tool_call_log,
- data={
- "output": tool_response,
- },
- metadata={
- LogMetadata.STARTED_AT: tool_call_started_at,
- LogMetadata.PROVIDER: tool_instance.identity.provider,
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter()
- - tool_call_started_at,
- },
- )
- tool_responses.append(tool_response)
- if tool_response["tool_response"] is not None:
- current_thoughts.append(
- ToolPromptMessage(
- content=str(tool_response["tool_response"]),
- tool_call_id=tool_call_id,
- name=tool_call_name,
- )
- )
-
- # update prompt tool
- for prompt_tool in prompt_messages_tools:
- self.update_prompt_message_tool(
- tool_instances[prompt_tool.name], prompt_tool
- )
- yield self.finish_log_message(
- log=round_log,
- data={
- "output": {
- "llm_response": response,
- "tool_responses": tool_responses,
- },
- },
- metadata={
- LogMetadata.STARTED_AT: round_started_at,
- LogMetadata.FINISHED_AT: time.perf_counter(),
- LogMetadata.ELAPSED_TIME: time.perf_counter() - round_started_at,
- LogMetadata.TOTAL_PRICE: current_llm_usage.total_price
- if current_llm_usage
- else 0,
- LogMetadata.CURRENCY: current_llm_usage.currency
- if current_llm_usage
- else "",
- LogMetadata.TOTAL_TOKENS: current_llm_usage.total_tokens
- if current_llm_usage
- else 0,
- },
- )
- iteration_step += 1
-
- yield self.create_json_message(
- {
- "execution_metadata": {
- LogMetadata.TOTAL_PRICE: llm_usage["usage"].total_price
- if llm_usage["usage"] is not None
- else 0,
- LogMetadata.CURRENCY: llm_usage["usage"].currency
- if llm_usage["usage"] is not None
- else "",
- LogMetadata.TOTAL_TOKENS: llm_usage["usage"].total_tokens
- if llm_usage["usage"] is not None
- else 0,
- }
- }
- )
-
- def check_tool_calls(self, llm_result_chunk: LLMResultChunk) -> bool:
- """
- Check if there is any tool call in llm result chunk
- """
- return bool(llm_result_chunk.delta.message.tool_calls)
-
- def check_blocking_tool_calls(self, llm_result: LLMResult) -> bool:
- """
- Check if there is any blocking tool call in llm result
- """
- return bool(llm_result.message.tool_calls)
-
- def extract_tool_calls(
- self, llm_result_chunk: LLMResultChunk
- ) -> list[tuple[str, str, dict[str, Any]]]:
- """
- Extract tool calls from llm result chunk
-
- Returns:
- List[Tuple[str, str, Dict[str, Any]]]: [(tool_call_id, tool_call_name, tool_call_args)]
- """
- tool_calls = []
- for prompt_message in llm_result_chunk.delta.message.tool_calls:
- args = {}
- if prompt_message.function.arguments != "":
- args = json.loads(prompt_message.function.arguments)
-
- tool_calls.append(
- (
- prompt_message.id,
- prompt_message.function.name,
- args,
- )
- )
-
- return tool_calls
-
- def extract_blocking_tool_calls(
- self, llm_result: LLMResult
- ) -> list[tuple[str, str, dict[str, Any]]]:
- """
- Extract blocking tool calls from llm result
-
- Returns:
- List[Tuple[str, str, Dict[str, Any]]]: [(tool_call_id, tool_call_name, tool_call_args)]
- """
- tool_calls = []
- for prompt_message in llm_result.message.tool_calls:
- args = {}
- if prompt_message.function.arguments != "":
- args = json.loads(prompt_message.function.arguments)
-
- tool_calls.append(
- (
- prompt_message.id,
- prompt_message.function.name,
- args,
- )
- )
-
- return tool_calls
-
- def _init_system_message(
- self, prompt_template: str, prompt_messages: list[PromptMessage]
- ) -> list[PromptMessage]:
- """
- Initialize system message
- """
- if not prompt_messages and prompt_template:
- return [
- SystemPromptMessage(content=prompt_template),
- ]
-
- if (
- prompt_messages
- and not isinstance(prompt_messages[0], SystemPromptMessage)
- and prompt_template
- ):
- prompt_messages.insert(0, SystemPromptMessage(content=prompt_template))
-
- return prompt_messages or []
-
- def _organize_user_query(
- self, query: str, prompt_messages: list[PromptMessage]
- ) -> list[PromptMessage]:
- """
- Organize user query
- """
-
- prompt_messages.append(UserPromptMessage(content=query))
-
- return prompt_messages
-
- def _clear_user_prompt_image_messages(
- self, prompt_messages: list[PromptMessage]
- ) -> list[PromptMessage]:
- """
- As for now, gpt supports both fc and vision at the first iteration.
- We need to remove the image messages from the prompt messages at the first iteration.
- """
- prompt_messages = deepcopy(prompt_messages)
-
- for prompt_message in prompt_messages:
- if isinstance(prompt_message, UserPromptMessage) and isinstance(
- prompt_message.content, list
- ):
- prompt_message.content = "\n".join(
- [
- content.data
- if content.type == PromptMessageContentType.TEXT
- else "[image]"
- if content.type == PromptMessageContentType.IMAGE
- else "[file]"
- for content in prompt_message.content
- ]
- )
-
- return prompt_messages
-
- def _organize_prompt_messages(
- self,
- current_thoughts: list[PromptMessage],
- history_prompt_messages: list[PromptMessage],
- ) -> list[PromptMessage]:
- prompt_template = ""
- history_prompt_messages = self._init_system_message(
- prompt_template, history_prompt_messages
- )
- query_prompt_messages = self._organize_user_query(self.query or "", [])
-
- prompt_messages = [
- *history_prompt_messages,
- *query_prompt_messages,
- *current_thoughts,
- ]
- if len(current_thoughts) != 0:
- # clear messages after the first iteration
- prompt_messages = self._clear_user_prompt_image_messages(prompt_messages)
- return prompt_messages
diff --git a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.yaml b/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.yaml
deleted file mode 100644
index e1eebe259b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/agent-0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9/strategies/function_calling.yaml
+++ /dev/null
@@ -1,58 +0,0 @@
-identity:
- name: function_calling
- author: Dify
- label:
- en_US: FunctionCalling
- zh_Hans: FunctionCalling
- pt_BR: FunctionCalling
-description:
- en_US: Function Calling is a basic strategy for agent, model will use the tools provided to perform the task.
- zh_Hans: Function Calling 是一个基本的 Agent 策略,模型将使用提供的工具来执行任务。
- pt_BR: Function Calling is a basic strategy for agent, model will use the tools provided to perform the task.
-parameters:
- - name: model
- type: model-selector
- scope: tool-call&llm
- required: true
- label:
- en_US: Model
- zh_Hans: 模型
- pt_BR: Model
- - name: tools
- type: array[tools]
- required: true
- label:
- en_US: Tool list
- zh_Hans: 工具列表
- pt_BR: Tool list
- - name: instruction
- type: string
- required: true
- label:
- en_US: Instruction
- zh_Hans: 指令
- pt_BR: Instruction
- auto_generate:
- type: prompt_instruction
- template:
- enabled: true
- - name: query
- type: string
- required: true
- label:
- en_US: Query
- zh_Hans: 查询
- pt_BR: Query
- - name: maximum_iterations
- type: number
- required: true
- label:
- en_US: Maximum Iterations
- zh_Hans: 最大迭代次数
- pt_BR: Maximum Iterations
- default: 3
- max: 30
- min: 1
-extra:
- python:
- source: strategies/function_calling.py
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/.env.example b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/.env.example
deleted file mode 100644
index dbb75b858b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/.env.example
+++ /dev/null
@@ -1,4 +0,0 @@
-INSTALL_METHOD=remote
-REMOTE_INSTALL_HOST=debug-plugin.dify.dev
-REMOTE_INSTALL_PORT=5003
-REMOTE_INSTALL_KEY=********-****-****-****-************
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/README.md b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/README.md
deleted file mode 100644
index f9417d0874..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/README.md
+++ /dev/null
@@ -1,7 +0,0 @@
-# Overview
-DeepSeek provides advanced AI capabilities for chats and completions. This plugin enables developers to integrate DeepSeek's models, including text generation (deepseek-chat and deepseek-code) via the API.
-
-# Configure
-After installation, you need to get API keys from [Deepseek](https://platform.deepseek.com/api_keys) and setup in Settings -> Model Provider.
-
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/deepseek.PNG b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/deepseek.PNG
deleted file mode 100644
index 89ed0fce0f..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/deepseek.PNG and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_l_en.svg b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_l_en.svg
deleted file mode 100644
index 425494404f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_l_en.svg
+++ /dev/null
@@ -1,22 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_s_en.svg b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_s_en.svg
deleted file mode 100644
index aa854a7504..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/_assets/icon_s_en.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/main.py b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/main.py
deleted file mode 100644
index f2bfcdfc0e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/main.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from dify_plugin import Plugin, DifyPluginEnv
-
-plugin = Plugin(DifyPluginEnv())
-
-if __name__ == '__main__':
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/manifest.yaml
deleted file mode 100644
index 90fcbbda80..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/manifest.yaml
+++ /dev/null
@@ -1,37 +0,0 @@
-author: langgenius
-created_at: '2024-09-20T00:13:50.29298939-04:00'
-description:
- en_US: Models provided by deepseek, such as deepseek-chat、deepseek-coder.
- zh_Hans: 深度求索提供的模型,例如 deepseek-chat、deepseek-coder 。
-icon: icon_s_en.svg
-label:
- en_US: DeepSeek
- zh_Hans: 深度求索
-meta:
- arch:
- - amd64
- - arm64
- runner:
- entrypoint: main
- language: python
- version: '3.12'
- version: 0.0.1
-name: deepseek
-plugins:
- models:
- - provider/deepseek.yaml
-resource:
- memory: 268435456
- permission:
- model:
- enabled: true
- llm: true
- moderation: false
- rerank: true
- speech2text: false
- text_embedding: true
- tts: false
- tool:
- enabled: true
-type: plugin
-version: 0.0.5
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/_position.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/_position.yaml
deleted file mode 100644
index eeac8aa405..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/_position.yaml
+++ /dev/null
@@ -1,3 +0,0 @@
-- deepseek-chat
-- deepseek-coder
-- deepseek-reasoner
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-chat.yaml
deleted file mode 100644
index 4cf6eef757..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-chat.yaml
+++ /dev/null
@@ -1,83 +0,0 @@
-model: deepseek-chat
-label:
- zh_Hans: deepseek-chat
- en_US: deepseek-chat
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - multi-tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 128000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 1
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 控制生成结果的多样性和随机性。数值越小,越严谨;数值越大,越发散。
- en_US: Control the diversity and randomness of generated results. The smaller the value, the more rigorous it is; the larger the value, the more divergent it is.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- type: float
- default: 1
- min: 0.01
- max: 1.00
- help:
- zh_Hans: 控制生成结果的随机性。数值越小,随机性越弱;数值越大,随机性越强。一般而言,top_p 和 temperature 两个参数选择一个进行调整即可。
- en_US: Control the randomness of generated results. The smaller the value, the weaker the randomness; the larger the value, the stronger the randomness. Generally speaking, you can adjust one of the two parameters top_p and temperature.
- - name: logprobs
- label:
- en_US: Logprobs
- help:
- zh_Hans: 是否返回所输出 token 的对数概率。如果为 true,则在 message 的 content 中返回每个输出 token 的对数概率。
- en_US: Whether to return the log probability of the output token. If true, returns the log probability of each output token in the content of message .
- type: boolean
- - name: top_logprobs
- label:
- en_US: Top Logprobs
- type: int
- default: 0
- min: 0
- max: 20
- help:
- zh_Hans: 一个介于 0 到 20 之间的整数 N,指定每个输出位置返回输出概率 top N 的 token,且返回这些 token 的对数概率。指定此参数时,logprobs 必须为 true。
- en_US: An integer N between 0 and 20, specifying that each output position returns the top N tokens with output probability, and returns the logarithmic probability of these tokens. When specifying this parameter, logprobs must be true.
- - name: frequency_penalty
- use_template: frequency_penalty
- default: 0
- min: -2.0
- max: 2.0
- help:
- zh_Hans: 介于 -2.0 和 2.0 之间的数字。如果该值为正,那么新 token 会根据其在已有文本中的出现频率受到相应的惩罚,降低模型重复相同内容的可能性。
- en_US: A number between -2.0 and 2.0. If the value is positive, new tokens are penalized based on their frequency of occurrence in existing text, reducing the likelihood that the model will repeat the same content.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: "2"
- output: "8"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-coder.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-coder.yaml
deleted file mode 100644
index 97310e76b9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-coder.yaml
+++ /dev/null
@@ -1,29 +0,0 @@
-model: deepseek-coder
-label:
- zh_Hans: deepseek-coder
- en_US: deepseek-coder
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - multi-tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 128000
-parameter_rules:
- - name: temperature
- use_template: temperature
- min: 0
- max: 1
- default: 0.5
- - name: top_p
- use_template: top_p
- min: 0
- max: 1
- default: 1
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 4096
- default: 1024
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-reasoner.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-reasoner.yaml
deleted file mode 100644
index 45ef70977b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/deepseek-reasoner.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-reasoner
-label:
- zh_Hans: deepseek-reasoner
- en_US: deepseek-reasoner
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 128000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "4"
- output: "16"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/llm.py b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/llm.py
deleted file mode 100644
index 3af28fb157..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/models/llm/llm.py
+++ /dev/null
@@ -1,33 +0,0 @@
-from collections.abc import Generator
-from typing import Optional, Union
-from dify_plugin.entities.model.llm import LLMMode, LLMResult
-from dify_plugin.entities.model.message import PromptMessage, PromptMessageTool
-from yarl import URL
-from dify_plugin import OAICompatLargeLanguageModel
-
-
-class DeepseekLargeLanguageModel(OAICompatLargeLanguageModel):
- def _invoke(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- self._add_custom_parameters(credentials)
- return super()._invoke(model, credentials, prompt_messages, model_parameters, tools, stop, stream)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- self._add_custom_parameters(credentials)
- super().validate_credentials(model, credentials)
-
- @staticmethod
- def _add_custom_parameters(credentials) -> None:
- credentials["endpoint_url"] = str(URL(credentials.get("endpoint_url", "https://api.deepseek.com")))
- credentials["mode"] = LLMMode.CHAT.value
- credentials["function_calling_type"] = "tool_call"
- credentials["stream_function_calling"] = "support"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.py b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.py
deleted file mode 100644
index 737fc92b43..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.py
+++ /dev/null
@@ -1,24 +0,0 @@
-import logging
-from dify_plugin.entities.model import ModelType
-from dify_plugin.errors.model import CredentialsValidateFailedError
-from dify_plugin import ModelProvider
-
-logger = logging.getLogger(__name__)
-
-
-class DeepSeekProvider(ModelProvider):
- def validate_provider_credentials(self, credentials: dict) -> None:
- """
- Validate provider credentials
- if validate failed, raise exception
-
- :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
- """
- try:
- model_instance = self.get_model_instance(ModelType.LLM)
- model_instance.validate_credentials(model="deepseek-chat", credentials=credentials)
- except CredentialsValidateFailedError as ex:
- raise ex
- except Exception as ex:
- logger.exception(f"{self.get_provider_schema().provider} credentials validate failed")
- raise ex
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.yaml b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.yaml
deleted file mode 100644
index 2750c35e06..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/provider/deepseek.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-background: '#c0cdff'
-configurate_methods:
-- predefined-model
-description:
- en_US: Models provided by deepseek, such as deepseek-reasoner、deepseek-chat、deepseek-coder.
- zh_Hans: 深度求索提供的模型,例如 deepseek-reasoner、deepseek-chat、deepseek-coder 。
-extra:
- python:
- model_sources:
- - models/llm/llm.py
- provider_source: provider/deepseek.py
-help:
- title:
- en_US: Get your API Key from deepseek
- zh_Hans: 从深度求索获取 API Key
- url:
- en_US: https://platform.deepseek.com/api_keys
-icon_large:
- en_US: icon_l_en.svg
-icon_small:
- en_US: icon_s_en.svg
-label:
- en_US: deepseek
- zh_Hans: 深度求索
-models:
- llm:
- position: models/llm/_position.yaml
- predefined:
- - models/llm/*.yaml
-provider: deepseek
-provider_credential_schema:
- credential_form_schemas:
- - label:
- en_US: API Key
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 在此输入您的 API Key
- required: true
- type: secret-input
- variable: api_key
- - label:
- en_US: Custom API endpoint URL
- zh_Hans: 自定义 API endpoint 地址
- placeholder:
- en_US: Base URL, e.g. https://api.deepseek.com/v1 or https://api.deepseek.com
- zh_Hans: Base URL, e.g. https://api.deepseek.com/v1 or https://api.deepseek.com
- required: false
- type: text-input
- variable: endpoint_url
-supported_model_types:
-- llm
diff --git a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/requirements.txt
deleted file mode 100644
index 5e06c37aa1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/deepseek-0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403/requirements.txt
+++ /dev/null
@@ -1 +0,0 @@
-dify_plugin==0.0.1b65
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/.env.example b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/.env.example
deleted file mode 100644
index dbb75b858b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/.env.example
+++ /dev/null
@@ -1,4 +0,0 @@
-INSTALL_METHOD=remote
-REMOTE_INSTALL_HOST=debug-plugin.dify.dev
-REMOTE_INSTALL_PORT=5003
-REMOTE_INSTALL_KEY=********-****-****-****-************
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/README.md b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/README.md
deleted file mode 100644
index c971d3ac5a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/README.md
+++ /dev/null
@@ -1,50 +0,0 @@
-## Overview
-
-Ollama is a cross-platform inference framework client (MacOS, Windows, Linux) designed for seamless deployment of large language models (LLMs) such as Llama 2, Mistral, Llava, and more. With its one-click setup, Ollama enables local execution of LLMs, providing enhanced data privacy and security by keeping your data on your own machine.
-
-Dify supports integrating LLM and Text Embedding capabilities of large language models deployed with Ollama.
-
-## Configure
-
-#### 1. Download Ollama
-Visit [Ollama download page](https://ollama.com/download) to download the Ollama client for your system.
-
-#### 2. Run Ollama and Chat with Llava
-
-````
-ollama run llama3.2
-````
-
-After successful launch, Ollama starts an API service on local port 11434, which can be accessed at `http://localhost:11434`.
-
-For other models, visit [Ollama Models](https://ollama.com/library) for more details.
-
-#### 3. Install Ollama Plugin
-Go to the Dify marketplace and search the Ollama to download it.
-
-
-
-#### 4. Integrate Ollama in Dify
-
-In `Settings > Model Providers > Ollama`, fill in:
-
-
-
-- Model Name:`llama3.2`
-- Base URL: `http://:11434`
-- Enter the base URL where the Ollama service is accessible.
-- If Dify is deployed using Docker, consider using the local network IP address, e.g., `http://192.168.1.100:11434` or `http://host.docker.internal:11434` to access the service.
-- For local source code deployment, use `http://localhost:11434`.
-- Model Type: `Chat`
-- Model Context Length: `4096`
-- The maximum context length of the model. If unsure, use the default value of 4096.
-- Maximum Token Limit: `4096`
-- The maximum number of tokens returned by the model. If there are no specific requirements for the model, this can be consistent with the model context length.
-- Support for Vision: `Yes`
-- Check this option if the model supports image understanding (multimodal), like `llava`.
-
-Click "Save" to use the model in the application after verifying that there are no errors.
-
-The integration method for Embedding models is similar to LLM, just change the model type to Text Embedding.
-
-For more detail, please check [Dify's official document](https://docs.dify.ai/development/models-integration/ollama).
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_l_en.svg b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_l_en.svg
deleted file mode 100644
index 39d8a1ece6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_l_en.svg
+++ /dev/null
@@ -1,15 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_s_en.svg b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_s_en.svg
deleted file mode 100644
index f8482a96b9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/icon_s_en.svg
+++ /dev/null
@@ -1,15 +0,0 @@
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-01.png b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-01.png
deleted file mode 100644
index 854a0be798..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-01.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-02.png b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-02.png
deleted file mode 100644
index 6c58186e89..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama-02.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama_config.PNG b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama_config.PNG
deleted file mode 100644
index a172a47f96..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/_assets/ollama_config.PNG and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/main.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/main.py
deleted file mode 100644
index f2bfcdfc0e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/main.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from dify_plugin import Plugin, DifyPluginEnv
-
-plugin = Plugin(DifyPluginEnv())
-
-if __name__ == '__main__':
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/manifest.yaml
deleted file mode 100644
index 2e13c4c87a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/manifest.yaml
+++ /dev/null
@@ -1,35 +0,0 @@
-author: langgenius
-created_at: '2024-09-20T00:13:50.29298939-04:00'
-description:
- en_US: Ollama
-icon: icon_s_en.svg
-label:
- en_US: Ollama
-meta:
- arch:
- - amd64
- - arm64
- runner:
- entrypoint: main
- language: python
- version: '3.12'
- version: 0.0.1
-name: ollama
-plugins:
- models:
- - provider/ollama.yaml
-resource:
- memory: 268435456
- permission:
- model:
- enabled: true
- llm: true
- moderation: false
- rerank: true
- speech2text: false
- text_embedding: true
- tts: false
- tool:
- enabled: true
-type: plugin
-version: 0.0.3
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/llm/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/llm/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/llm/llm.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/llm/llm.py
deleted file mode 100644
index 2524a828bb..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/llm/llm.py
+++ /dev/null
@@ -1,743 +0,0 @@
-import json
-import logging
-import re
-from collections.abc import Generator
-from decimal import Decimal
-from typing import Any, Optional, Union, cast
-from urllib.parse import urljoin
-import requests
-from dify_plugin.entities.model import (
- AIModelEntity,
- DefaultParameterName,
- FetchFrom,
- I18nObject,
- ModelFeature,
- ModelPropertyKey,
- ModelType,
- ParameterRule,
- ParameterType,
- PriceConfig,
-)
-from dify_plugin.entities.model.llm import (
- LLMMode,
- LLMResult,
- LLMResultChunk,
- LLMResultChunkDelta,
-)
-from dify_plugin.entities.model.message import (
- AssistantPromptMessage,
- ImagePromptMessageContent,
- PromptMessage,
- PromptMessageContentType,
- PromptMessageTool,
- SystemPromptMessage,
- TextPromptMessageContent,
- ToolPromptMessage,
- UserPromptMessage,
-)
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-from dify_plugin.interfaces.model.large_language_model import LargeLanguageModel
-
-logger = logging.getLogger(__name__)
-
-
-class OllamaLargeLanguageModel(LargeLanguageModel):
- """
- Model class for Ollama large language model.
- """
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- """
- Invoke large language model
-
- :param model: model name
- :param credentials: model credentials
- :param prompt_messages: prompt messages
- :param model_parameters: model parameters
- :param tools: tools for tool calling
- :param stop: stop words
- :param stream: is stream response
- :param user: unique user id
- :return: full response or stream response chunk generator result
- """
- return self._generate(
- model=model,
- credentials=credentials,
- prompt_messages=prompt_messages,
- model_parameters=model_parameters,
- tools=tools,
- stop=stop,
- stream=stream,
- user=user,
- )
-
- def get_num_tokens(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- tools: Optional[list[PromptMessageTool]] = None,
- ) -> int:
- """
- Get number of tokens for given prompt messages
-
- :param model: model name
- :param credentials: model credentials
- :param prompt_messages: prompt messages
- :param tools: tools for tool calling
- :return:
- """
- model_mode = self.get_model_mode(model, credentials)
- if model_mode == LLMMode.CHAT:
- return self._num_tokens_from_messages(prompt_messages)
- else:
- first_prompt_message = prompt_messages[0]
- if isinstance(first_prompt_message.content, str):
- text = first_prompt_message.content
- elif isinstance(first_prompt_message.content, list):
- text = ""
- for message_content in first_prompt_message.content:
- if message_content.type == PromptMessageContentType.TEXT:
- message_content = cast(
- TextPromptMessageContent, message_content
- )
- text = message_content.data
- break
- return self._get_num_tokens_by_gpt2(text)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- self._generate(
- model=model,
- credentials=credentials,
- prompt_messages=[UserPromptMessage(content="ping")],
- model_parameters={"num_predict": 5},
- stream=False,
- )
- except InvokeError as ex:
- raise CredentialsValidateFailedError(
- f"An error occurred during credentials validation: {ex.description}"
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(
- f"An error occurred during credentials validation: {str(ex)}"
- )
-
- def _generate(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- """
- Invoke llm completion model
-
- :param model: model name
- :param credentials: credentials
- :param prompt_messages: prompt messages
- :param model_parameters: model parameters
- :param stop: stop words
- :param stream: is stream response
- :param user: unique user id
- :return: full response or stream response chunk generator result
- """
- headers = {"Content-Type": "application/json"}
- endpoint_url = credentials["base_url"]
- if not endpoint_url.endswith("/"):
- endpoint_url += "/"
- data = {"model": model, "stream": stream}
- if "format" in model_parameters:
- data["format"] = model_parameters["format"]
- del model_parameters["format"]
- if "keep_alive" in model_parameters:
- data["keep_alive"] = model_parameters["keep_alive"]
- del model_parameters["keep_alive"]
- data["options"] = model_parameters or {}
- if stop:
- data["options"]["stop"] = stop
- completion_type = LLMMode.value_of(credentials["mode"])
- if completion_type is LLMMode.CHAT:
- endpoint_url = urljoin(endpoint_url, "api/chat")
- data["messages"] = [
- self._convert_prompt_message_to_dict(m) for m in prompt_messages
- ]
- if tools:
- data["tools"] = [
- self._convert_prompt_message_tool_to_dict(tool) for tool in tools
- ]
- else:
- endpoint_url = urljoin(endpoint_url, "api/generate")
- first_prompt_message = prompt_messages[0]
- if isinstance(first_prompt_message, UserPromptMessage):
- first_prompt_message = cast(UserPromptMessage, first_prompt_message)
- if isinstance(first_prompt_message.content, str):
- data["prompt"] = first_prompt_message.content
- elif isinstance(first_prompt_message.content, list):
- text = ""
- images = []
- for message_content in first_prompt_message.content:
- if message_content.type == PromptMessageContentType.TEXT:
- message_content = cast(
- TextPromptMessageContent, message_content
- )
- text = message_content.data
- elif message_content.type == PromptMessageContentType.IMAGE:
- message_content = cast(
- ImagePromptMessageContent, message_content
- )
- image_data = re.sub(
- "^data:image\\/[a-zA-Z]+;base64,",
- "",
- message_content.data,
- )
- images.append(image_data)
- data["prompt"] = text
- data["images"] = images
- response = requests.post(
- endpoint_url, headers=headers, json=data, timeout=(10, 300), stream=stream
- )
- response.encoding = "utf-8"
- if response.status_code != 200:
- raise InvokeError(
- f"API request failed with status code {response.status_code}: {response.text}"
- )
- if stream:
- return self._handle_generate_stream_response(
- model, credentials, completion_type, response, prompt_messages
- )
- return self._handle_generate_response(
- model, credentials, completion_type, response, prompt_messages, tools
- )
-
- def _handle_generate_response(
- self,
- model: str,
- credentials: dict,
- completion_type: LLMMode,
- response: requests.Response,
- prompt_messages: list[PromptMessage],
- tools: Optional[list[PromptMessageTool]],
- ) -> LLMResult:
- """
- Handle llm completion response
-
- :param model: model name
- :param credentials: model credentials
- :param completion_type: completion type
- :param response: response
- :param prompt_messages: prompt messages
- :return: llm result
- """
- response_json = response.json()
- tool_calls = []
- if completion_type is LLMMode.CHAT:
- message = response_json.get("message", {})
- response_content = message.get("content", "")
- response_tool_calls = message.get("tool_calls", [])
- tool_calls = [
- self._extract_response_tool_call(tool_call)
- for tool_call in response_tool_calls
- ]
- else:
- response_content = response_json["response"]
- assistant_message = AssistantPromptMessage(
- content=response_content, tool_calls=tool_calls
- )
- if "prompt_eval_count" in response_json and "eval_count" in response_json:
- prompt_tokens = response_json["prompt_eval_count"]
- completion_tokens = response_json["eval_count"]
- else:
- prompt_tokens = self._get_num_tokens_by_gpt2(prompt_messages[0].content)
- completion_tokens = self._get_num_tokens_by_gpt2(assistant_message.content)
- usage = self._calc_response_usage(
- model, credentials, prompt_tokens, completion_tokens
- )
- result = LLMResult(
- model=response_json["model"],
- prompt_messages=prompt_messages,
- message=assistant_message,
- usage=usage,
- )
- return result
-
- def _handle_generate_stream_response(
- self,
- model: str,
- credentials: dict,
- completion_type: LLMMode,
- response: requests.Response,
- prompt_messages: list[PromptMessage],
- ) -> Generator:
- """
- Handle llm completion stream response
-
- :param model: model name
- :param credentials: model credentials
- :param completion_type: completion type
- :param response: response
- :param prompt_messages: prompt messages
- :return: llm response chunk generator result
- """
- full_text = ""
- chunk_index = 0
-
- def create_final_llm_result_chunk(
- index: int, message: AssistantPromptMessage, finish_reason: str
- ) -> LLMResultChunk:
- prompt_tokens = self._get_num_tokens_by_gpt2(prompt_messages[0].content)
- completion_tokens = self._get_num_tokens_by_gpt2(full_text)
- usage = self._calc_response_usage(
- model, credentials, prompt_tokens, completion_tokens
- )
- return LLMResultChunk(
- model=model,
- prompt_messages=prompt_messages,
- delta=LLMResultChunkDelta(
- index=index,
- message=message,
- finish_reason=finish_reason,
- usage=usage,
- ),
- )
-
- for chunk in response.iter_lines(decode_unicode=True, delimiter="\n"):
- if not chunk:
- continue
- try:
- chunk_json = json.loads(chunk)
- except json.JSONDecodeError as e:
- yield create_final_llm_result_chunk(
- index=chunk_index,
- message=AssistantPromptMessage(content=""),
- finish_reason="Non-JSON encountered.",
- )
- chunk_index += 1
- break
- if completion_type is LLMMode.CHAT:
- if not chunk_json:
- continue
- if "message" not in chunk_json:
- text = ""
- else:
- text = chunk_json.get("message").get("content", "")
- else:
- if not chunk_json:
- continue
- text = chunk_json["response"]
- assistant_prompt_message = AssistantPromptMessage(content=text)
- full_text += text
- if chunk_json["done"]:
- if "prompt_eval_count" in chunk_json:
- prompt_tokens = chunk_json["prompt_eval_count"]
- else:
- prompt_message_content = prompt_messages[0].content
- if isinstance(prompt_message_content, str):
- prompt_tokens = self._get_num_tokens_by_gpt2(
- prompt_message_content
- )
- elif isinstance(prompt_message_content, list):
- content_text = ""
- for message_content in prompt_message_content:
- if message_content.type == PromptMessageContentType.TEXT:
- message_content = cast(
- TextPromptMessageContent, message_content
- )
- content_text += message_content.data
- prompt_tokens = self._get_num_tokens_by_gpt2(content_text)
- completion_tokens = chunk_json.get(
- "eval_count", self._get_num_tokens_by_gpt2(full_text)
- )
- usage = self._calc_response_usage(
- model, credentials, prompt_tokens, completion_tokens
- )
- yield LLMResultChunk(
- model=chunk_json["model"],
- prompt_messages=prompt_messages,
- delta=LLMResultChunkDelta(
- index=chunk_index,
- message=assistant_prompt_message,
- finish_reason="stop",
- usage=usage,
- ),
- )
- else:
- yield LLMResultChunk(
- model=chunk_json["model"],
- prompt_messages=prompt_messages,
- delta=LLMResultChunkDelta(
- index=chunk_index, message=assistant_prompt_message
- ),
- )
- chunk_index += 1
-
- def _convert_prompt_message_tool_to_dict(self, tool: PromptMessageTool) -> dict:
- """
- Convert PromptMessageTool to dict for Ollama API
-
- :param tool: tool
- :return: tool dict
- """
- return {
- "type": "function",
- "function": {
- "name": tool.name,
- "description": tool.description,
- "parameters": tool.parameters,
- },
- }
-
- def _convert_prompt_message_to_dict(self, message: PromptMessage) -> dict:
- """
- Convert PromptMessage to dict for Ollama API
-
- :param message: prompt message
- :return: message dict
- """
- if isinstance(message, UserPromptMessage):
- message = cast(UserPromptMessage, message)
- if isinstance(message.content, str):
- message_dict = {"role": "user", "content": message.content}
- elif isinstance(message.content, list):
- text = ""
- images = []
- for message_content in message.content:
- if message_content.type == PromptMessageContentType.TEXT:
- message_content = cast(
- TextPromptMessageContent, message_content
- )
- text = message_content.data
- elif message_content.type == PromptMessageContentType.IMAGE:
- message_content = cast(
- ImagePromptMessageContent, message_content
- )
- image_data = re.sub(
- "^data:image\\/[a-zA-Z]+;base64,", "", message_content.data
- )
- images.append(image_data)
- message_dict = {"role": "user", "content": text, "images": images}
- elif isinstance(message, AssistantPromptMessage):
- message = cast(AssistantPromptMessage, message)
- message_dict = {"role": "assistant", "content": message.content}
- elif isinstance(message, SystemPromptMessage):
- message = cast(SystemPromptMessage, message)
- message_dict = {"role": "system", "content": message.content}
- elif isinstance(message, ToolPromptMessage):
- message = cast(ToolPromptMessage, message)
- message_dict = {"role": "tool", "content": message.content}
- else:
- raise ValueError(f"Got unknown type {message}")
- return message_dict
-
- def _num_tokens_from_messages(self, messages: list[PromptMessage]) -> int:
- """
- Calculate num tokens.
-
- :param messages: messages
- """
- num_tokens = 0
- messages_dict = [self._convert_prompt_message_to_dict(m) for m in messages]
- for message in messages_dict:
- for key, value in message.items():
- num_tokens += self._get_num_tokens_by_gpt2(str(key))
- num_tokens += self._get_num_tokens_by_gpt2(str(value))
- return num_tokens
-
- def _extract_response_tool_call(
- self, response_tool_call: dict
- ) -> AssistantPromptMessage.ToolCall:
- """
- Extract response tool call
- """
- tool_call = None
- if response_tool_call and "function" in response_tool_call:
- arguments = response_tool_call.get("function", {}).get("arguments")
- if isinstance(arguments, dict):
- arguments = json.dumps(arguments)
- function = AssistantPromptMessage.ToolCall.ToolCallFunction(
- name=response_tool_call.get("function", {}).get("name"),
- arguments=arguments,
- )
- tool_call = AssistantPromptMessage.ToolCall(
- id=response_tool_call.get("function", {}).get("name"),
- type="function",
- function=function,
- )
- return tool_call
-
- def get_customizable_model_schema(
- self, model: str, credentials: dict
- ) -> AIModelEntity:
- """
- Get customizable model schema.
-
- :param model: model name
- :param credentials: credentials
-
- :return: model schema
- """
- extras: dict[str, Any] = {"features": []}
- if "vision_support" in credentials and credentials["vision_support"] == "true":
- extras["features"].append(ModelFeature.VISION)
- if (
- "function_call_support" in credentials
- and credentials["function_call_support"] == "true"
- ):
- extras["features"].append(ModelFeature.TOOL_CALL)
- extras["features"].append(ModelFeature.MULTI_TOOL_CALL)
- entity = AIModelEntity(
- model=model,
- label=I18nObject(zh_Hans=model, en_US=model),
- model_type=ModelType.LLM,
- fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
- model_properties={
- ModelPropertyKey.MODE: credentials.get("mode"),
- ModelPropertyKey.CONTEXT_SIZE: int(
- credentials.get("context_size", 4096)
- ),
- },
- parameter_rules=[
- ParameterRule(
- name=DefaultParameterName.TEMPERATURE.value,
- use_template=DefaultParameterName.TEMPERATURE.value,
- label=I18nObject(en_US="Temperature", zh_Hans="温度"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="The temperature of the model. Increasing the temperature will make the model answer more creatively. (Default: 0.8)",
- zh_Hans="模型的温度。增加温度将使模型的回答更具创造性。(默认值:0.8)",
- ),
- default=0.1,
- min=0,
- max=1,
- ),
- ParameterRule(
- name=DefaultParameterName.TOP_P.value,
- use_template=DefaultParameterName.TOP_P.value,
- label=I18nObject(en_US="Top P", zh_Hans="Top P"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="Works together with top-k. A higher value (e.g., 0.95) will lead to more diverse text, while a lower value (e.g., 0.5) will generate more focused and conservative text. (Default: 0.9)",
- zh_Hans="与top-k一起工作。较高的值(例如,0.95)会导致生成更多样化的文本,而较低的值(例如,0.5)会生成更专注和保守的文本。(默认值:0.9)",
- ),
- default=0.9,
- min=0,
- max=1,
- ),
- ParameterRule(
- name="top_k",
- label=I18nObject(en_US="Top K", zh_Hans="Top K"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Reduces the probability of generating nonsense. A higher value (e.g. 100) will give more diverse answers, while a lower value (e.g. 10) will be more conservative. (Default: 40)",
- zh_Hans="减少生成无意义内容的可能性。较高的值(例如100)将提供更多样化的答案,而较低的值(例如10)将更为保守。(默认值:40)",
- ),
- min=1,
- max=100,
- ),
- ParameterRule(
- name="repeat_penalty",
- label=I18nObject(en_US="Repeat Penalty"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="Sets how strongly to penalize repetitions. A higher value (e.g., 1.5) will penalize repetitions more strongly, while a lower value (e.g., 0.9) will be more lenient. (Default: 1.1)",
- zh_Hans="设置对重复内容的惩罚强度。一个较高的值(例如,1.5)会更强地惩罚重复内容,而一个较低的值(例如,0.9)则会相对宽容。(默认值:1.1)",
- ),
- min=-2,
- max=2,
- ),
- ParameterRule(
- name="num_predict",
- use_template="max_tokens",
- label=I18nObject(en_US="Num Predict", zh_Hans="最大令牌数预测"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Maximum number of tokens to predict when generating text. (Default: 128, -1 = infinite generation, -2 = fill context)",
- zh_Hans="生成文本时预测的最大令牌数。(默认值:128,-1 = 无限生成,-2 = 填充上下文)",
- ),
- default=512
- if int(credentials.get("max_tokens", 4096)) >= 768
- else 128,
- min=-2,
- max=int(credentials.get("max_tokens", 4096)),
- ),
- ParameterRule(
- name="mirostat",
- label=I18nObject(
- en_US="Mirostat sampling", zh_Hans="Mirostat 采样"
- ),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Enable Mirostat sampling for controlling perplexity. (default: 0, 0 = disabled, 1 = Mirostat, 2 = Mirostat 2.0)",
- zh_Hans="启用 Mirostat 采样以控制困惑度。(默认值:0,0 = 禁用,1 = Mirostat,2 = Mirostat 2.0)",
- ),
- min=0,
- max=2,
- ),
- ParameterRule(
- name="mirostat_eta",
- label=I18nObject(en_US="Mirostat Eta", zh_Hans="学习率"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="Influences how quickly the algorithm responds to feedback from the generated text. A lower learning rate will result in slower adjustments, while a higher learning rate will make the algorithm more responsive. (Default: 0.1)",
- zh_Hans="影响算法对生成文本反馈响应的速度。较低的学习率会导致调整速度变慢,而较高的学习率会使得算法更加灵敏。(默认值:0.1)",
- ),
- precision=1,
- ),
- ParameterRule(
- name="mirostat_tau",
- label=I18nObject(en_US="Mirostat Tau", zh_Hans="文本连贯度"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="Controls the balance between coherence and diversity of the output. A lower value will result in more focused and coherent text. (Default: 5.0)",
- zh_Hans="控制输出的连贯性和多样性之间的平衡。较低的值会导致更专注和连贯的文本。(默认值:5.0)",
- ),
- precision=1,
- ),
- ParameterRule(
- name="num_ctx",
- label=I18nObject(
- en_US="Size of context window", zh_Hans="上下文窗口大小"
- ),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Sets the size of the context window used to generate the next token. (Default: 2048)",
- zh_Hans="设置用于生成下一个标记的上下文窗口大小。(默认值:2048)",
- ),
- default=2048,
- min=1,
- ),
- ParameterRule(
- name="num_gpu",
- label=I18nObject(en_US="GPU Layers", zh_Hans="GPU 层数"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="The number of layers to offload to the GPU(s). On macOS it defaults to 1 to enable metal support, 0 to disable.As long as a model fits into one gpu it stays in one. It does not set the number of GPU(s). ",
- zh_Hans="加载到 GPU 的层数。在 macOS 上,默认为 1 以启用 Metal 支持,设置为 0 则禁用。只要模型适合一个 GPU,它就保留在其中。它不设置 GPU 的数量。",
- ),
- min=-1,
- default=1,
- ),
- ParameterRule(
- name="num_thread",
- label=I18nObject(en_US="Num Thread", zh_Hans="线程数"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Sets the number of threads to use during computation. By default, Ollama will detect this for optimal performance. It is recommended to set this value to the number of physical CPU cores your system has (as opposed to the logical number of cores).",
- zh_Hans="设置计算过程中使用的线程数。默认情况下,Ollama会检测以获得最佳性能。建议将此值设置为系统拥有的物理CPU核心数(而不是逻辑核心数)。",
- ),
- min=1,
- ),
- ParameterRule(
- name="repeat_last_n",
- label=I18nObject(en_US="Repeat last N", zh_Hans="回溯内容"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Sets how far back for the model to look back to prevent repetition. (Default: 64, 0 = disabled, -1 = num_ctx)",
- zh_Hans="设置模型回溯多远的内容以防止重复。(默认值:64,0 = 禁用,-1 = num_ctx)",
- ),
- min=-1,
- ),
- ParameterRule(
- name="tfs_z",
- label=I18nObject(en_US="TFS Z", zh_Hans="减少标记影响"),
- type=ParameterType.FLOAT,
- help=I18nObject(
- en_US="Tail free sampling is used to reduce the impact of less probable tokens from the output. A higher value (e.g., 2.0) will reduce the impact more, while a value of 1.0 disables this setting. (default: 1)",
- zh_Hans="用于减少输出中不太可能的标记的影响。较高的值(例如,2.0)会更多地减少这种影响,而1.0的值则会禁用此设置。(默认值:1)",
- ),
- precision=1,
- ),
- ParameterRule(
- name="seed",
- label=I18nObject(en_US="Seed", zh_Hans="随机数种子"),
- type=ParameterType.INT,
- help=I18nObject(
- en_US="Sets the random number seed to use for generation. Setting this to a specific number will make the model generate the same text for the same prompt. (Default: 0)",
- zh_Hans="设置用于生成的随机数种子。将此设置为特定数字将使模型对相同的提示生成相同的文本。(默认值:0)",
- ),
- ),
- ParameterRule(
- name="keep_alive",
- label=I18nObject(en_US="Keep Alive", zh_Hans="模型存活时间"),
- type=ParameterType.STRING,
- help=I18nObject(
- en_US="Sets how long the model is kept in memory after generating a response. This must be a duration string with a unit (e.g., '10m' for 10 minutes or '24h' for 24 hours). A negative number keeps the model loaded indefinitely, and '0' unloads the model immediately after generating a response. Valid time units are 's','m','h'. (Default: 5m)",
- zh_Hans="设置模型在生成响应后在内存中保留的时间。这必须是一个带有单位的持续时间字符串(例如,'10m' 表示10分钟,'24h' 表示24小时)。负数表示无限期地保留模型,'0'表示在生成响应后立即卸载模型。有效的时间单位有 's'(秒)、'm'(分钟)、'h'(小时)。(默认值:5m)",
- ),
- ),
- ParameterRule(
- name="format",
- label=I18nObject(en_US="Format", zh_Hans="返回格式"),
- type=ParameterType.STRING,
- help=I18nObject(
- en_US="the format to return a response in. Currently the only accepted value is json.",
- zh_Hans="返回响应的格式。目前唯一接受的值是json。",
- ),
- options=["json"],
- ),
- ],
- pricing=PriceConfig(
- input=Decimal(credentials.get("input_price", 0)),
- output=Decimal(credentials.get("output_price", 0)),
- unit=Decimal(credentials.get("unit", 0)),
- currency=credentials.get("currency", "USD"),
- ),
- **extras,
- )
- return entity
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeAuthorizationError: [requests.exceptions.InvalidHeader],
- InvokeBadRequestError: [
- requests.exceptions.HTTPError,
- requests.exceptions.InvalidURL,
- ],
- InvokeRateLimitError: [requests.exceptions.RetryError],
- InvokeServerUnavailableError: [
- requests.exceptions.ConnectionError,
- requests.exceptions.HTTPError,
- ],
- InvokeConnectionError: [
- requests.exceptions.ConnectTimeout,
- requests.exceptions.ReadTimeout,
- ],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/text_embedding/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/text_embedding/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/text_embedding/text_embedding.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/text_embedding/text_embedding.py
deleted file mode 100644
index 0056fe870c..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/models/text_embedding/text_embedding.py
+++ /dev/null
@@ -1,200 +0,0 @@
-import json
-import logging
-import time
-from decimal import Decimal
-from typing import Optional
-from urllib.parse import urljoin
-from dify_plugin import TextEmbeddingModel
-import numpy as np
-import requests
-from dify_plugin.entities.model import (
- AIModelEntity,
- EmbeddingInputType,
- FetchFrom,
- I18nObject,
- ModelPropertyKey,
- ModelType,
- PriceConfig,
- PriceType,
-)
-from dify_plugin.entities.model.text_embedding import (
- EmbeddingUsage,
- TextEmbeddingResult,
-)
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-
-logger = logging.getLogger(__name__)
-
-
-class OllamaEmbeddingModel(TextEmbeddingModel):
- """
- Model class for an Ollama text embedding model.
- """
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- texts: list[str],
- user: Optional[str] = None,
- input_type: EmbeddingInputType = EmbeddingInputType.DOCUMENT,
- ) -> TextEmbeddingResult:
- """
- Invoke text embedding model
-
- :param model: model name
- :param credentials: model credentials
- :param texts: texts to embed
- :param user: unique user id
- :param input_type: input type
- :return: embeddings result
- """
- headers = {"Content-Type": "application/json"}
- endpoint_url = credentials.get("base_url", "")
- if endpoint_url and not endpoint_url.endswith("/"):
- endpoint_url += "/"
- endpoint_url = urljoin(endpoint_url, "api/embed")
- context_size = self._get_context_size(model, credentials)
- inputs = []
- used_tokens = 0
- for text in texts:
- num_tokens = self._get_num_tokens_by_gpt2(text)
- if num_tokens >= context_size:
- cutoff = int(np.floor(len(text) * (context_size / num_tokens)))
- inputs.append(text[0:cutoff])
- else:
- inputs.append(text)
- payload = {"input": inputs, "model": model, "options": {"use_mmap": True}}
- response = requests.post(
- endpoint_url, headers=headers, data=json.dumps(payload), timeout=(10, 300)
- )
- response.raise_for_status()
- response_data = response.json()
- embeddings = response_data["embeddings"]
- embedding_used_tokens = self.get_num_tokens(model, credentials, inputs)
- used_tokens += sum(embedding_used_tokens)
- usage = self._calc_response_usage(
- model=model, credentials=credentials, tokens=used_tokens
- )
- return TextEmbeddingResult(embeddings=embeddings, usage=usage, model=model)
-
- def get_num_tokens(
- self, model: str, credentials: dict, texts: list[str]
- ) -> list[int]:
- """
- Approximate number of tokens for given messages using GPT2 tokenizer
-
- :param model: model name
- :param credentials: model credentials
- :param texts: texts to embed
- :return:
- """
- return [self._get_num_tokens_by_gpt2(text) for text in texts]
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- self._invoke(model=model, credentials=credentials, texts=["ping"])
- except InvokeError as ex:
- raise CredentialsValidateFailedError(
- f"An error occurred during credentials validation: {ex.description}"
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(
- f"An error occurred during credentials validation: {str(ex)}"
- )
-
- def get_customizable_model_schema(
- self, model: str, credentials: dict
- ) -> AIModelEntity:
- """
- generate custom model entities from credentials
- """
- entity = AIModelEntity(
- model=model,
- label=I18nObject(en_US=model),
- model_type=ModelType.TEXT_EMBEDDING,
- fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
- model_properties={
- ModelPropertyKey.CONTEXT_SIZE: int(
- credentials.get("context_size", 512)
- ),
- ModelPropertyKey.MAX_CHUNKS: 1,
- },
- parameter_rules=[],
- pricing=PriceConfig(
- input=Decimal(credentials.get("input_price", 0)),
- unit=Decimal(credentials.get("unit", 0)),
- currency=credentials.get("currency", "USD"),
- ),
- )
- return entity
-
- def _calc_response_usage(
- self, model: str, credentials: dict, tokens: int
- ) -> EmbeddingUsage:
- """
- Calculate response usage
-
- :param model: model name
- :param credentials: model credentials
- :param tokens: input tokens
- :return: usage
- """
- input_price_info = self.get_price(
- model=model,
- credentials=credentials,
- price_type=PriceType.INPUT,
- tokens=tokens,
- )
- usage = EmbeddingUsage(
- tokens=tokens,
- total_tokens=tokens,
- unit_price=input_price_info.unit_price,
- price_unit=input_price_info.unit,
- total_price=input_price_info.total_amount,
- currency=input_price_info.currency,
- latency=time.perf_counter() - self.started_at,
- )
- return usage
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeAuthorizationError: [requests.exceptions.InvalidHeader],
- InvokeBadRequestError: [
- requests.exceptions.HTTPError,
- requests.exceptions.InvalidURL,
- ],
- InvokeRateLimitError: [requests.exceptions.RetryError],
- InvokeServerUnavailableError: [
- requests.exceptions.ConnectionError,
- requests.exceptions.HTTPError,
- ],
- InvokeConnectionError: [
- requests.exceptions.ConnectTimeout,
- requests.exceptions.ReadTimeout,
- ],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.py b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.py
deleted file mode 100644
index ba7607c2ff..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.py
+++ /dev/null
@@ -1,15 +0,0 @@
-import logging
-from dify_plugin import ModelProvider
-
-logger = logging.getLogger(__name__)
-
-
-class OpenAIProvider(ModelProvider):
- def validate_provider_credentials(self, credentials: dict) -> None:
- """
- Validate provider credentials
- if validate failed, raise exception
-
- :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
- """
- pass
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.yaml b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.yaml
deleted file mode 100644
index 3d255df16c..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/provider/ollama.yaml
+++ /dev/null
@@ -1,123 +0,0 @@
-background: '#F9FAFB'
-configurate_methods:
-- customizable-model
-extra:
- python:
- model_sources:
- - models/llm/llm.py
- - models/text_embedding/text_embedding.py
- provider_source: provider/ollama.py
-help:
- title:
- en_US: How to integrate with Ollama
- zh_Hans: 如何集成 Ollama
- url:
- en_US: https://docs.dify.ai/tutorials/model-configuration/ollama
-icon_large:
- en_US: icon_l_en.svg
-icon_small:
- en_US: icon_s_en.svg
-label:
- en_US: Ollama
-model_credential_schema:
- credential_form_schemas:
- - label:
- en_US: Base URL
- zh_Hans: 基础 URL
- placeholder:
- en_US: Base url of Ollama server, e.g. http://192.168.1.100:11434
- zh_Hans: Ollama server 的基础 URL,例如 http://192.168.1.100:11434
- required: true
- type: text-input
- variable: base_url
- - default: chat
- label:
- en_US: Completion mode
- zh_Hans: 模型类型
- options:
- - label:
- en_US: Completion
- zh_Hans: 补全
- value: completion
- - label:
- en_US: Chat
- zh_Hans: 对话
- value: chat
- placeholder:
- en_US: Select completion mode
- zh_Hans: 选择对话类型
- required: true
- show_on:
- - value: llm
- variable: __model_type
- type: select
- variable: mode
- - default: '4096'
- label:
- en_US: Model context size
- zh_Hans: 模型上下文长度
- placeholder:
- en_US: Enter your Model context size
- zh_Hans: 在此输入您的模型上下文长度
- required: true
- type: text-input
- variable: context_size
- - default: '4096'
- label:
- en_US: Upper bound for max tokens
- zh_Hans: 最大 token 上限
- required: true
- show_on:
- - value: llm
- variable: __model_type
- type: text-input
- variable: max_tokens
- - default: 'false'
- label:
- en_US: Vision support
- zh_Hans: 是否支持 Vision
- options:
- - label:
- en_US: 'Yes'
- zh_Hans: 是
- value: 'true'
- - label:
- en_US: 'No'
- zh_Hans: 否
- value: 'false'
- required: false
- show_on:
- - value: llm
- variable: __model_type
- type: radio
- variable: vision_support
- - default: 'false'
- label:
- en_US: Function call support
- zh_Hans: 是否支持函数调用
- options:
- - label:
- en_US: 'Yes'
- zh_Hans: 是
- value: 'true'
- - label:
- en_US: 'No'
- zh_Hans: 否
- value: 'false'
- required: false
- show_on:
- - value: llm
- variable: __model_type
- type: radio
- variable: function_call_support
- model:
- label:
- en_US: Model Name
- zh_Hans: 模型名称
- placeholder:
- en_US: Enter your model name
- zh_Hans: 输入模型名称
-provider: ollama
-supported_model_types:
-- llm
-- text-embedding
diff --git a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/requirements.txt
deleted file mode 100644
index 268b497a18..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/ollama-0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7/requirements.txt
+++ /dev/null
@@ -1,2 +0,0 @@
-dify_plugin==0.0.1b65
-numpy~=2.1.3
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/README.md b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/README.md
deleted file mode 100644
index a06958301a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/README.md
+++ /dev/null
@@ -1,9 +0,0 @@
-## Overview
-
-This plugin provides access to models that are OpenAI-compatible, including LLMs, reranking, text embedding, speech-to-text (STT), and text-to-speech(TTS) models. Developers can easily add models by providing configuration parameters such as the model name and API key.
-
-## Configure
-
-Configure the OpenAI-API-compatible model by providing its core details (Type, Name, API Key, URL) and adjusting further options like completion, context, and token limits, as well as streaming and vision settings. Save when done.
-
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/audio.mp3 b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/audio.mp3
deleted file mode 100644
index 7c86e02e16..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/audio.mp3 and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/icon.svg b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/icon.svg
deleted file mode 100644
index ce65af405f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/icon.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/openai_api_compatible-01.png b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/openai_api_compatible-01.png
deleted file mode 100644
index 4189f8de9b..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/_assets/openai_api_compatible-01.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/main.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/main.py
deleted file mode 100644
index 37eb41b64f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/main.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from dify_plugin import Plugin, DifyPluginEnv
-
-plugin = Plugin(DifyPluginEnv())
-
-if __name__ == "__main__":
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/manifest.yaml
deleted file mode 100644
index 1eed23d797..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/manifest.yaml
+++ /dev/null
@@ -1,31 +0,0 @@
-version: 0.0.11
-type: plugin
-author: "langgenius"
-name: "openai_api_compatible"
-description:
- en_US: Model providers compatible with OpenAI's API standard, such as LM Studio.
- zh_Hans: 兼容 OpenAI API 的模型供应商,例如 LM Studio 。
-label:
- en_US: "OpenAI-API-compatible"
-created_at: "2024-07-12T08:03:44.658609186Z"
-icon: icon.svg
-resource:
- memory: 1048576
- permission:
- tool:
- enabled: true
- model:
- enabled: true
- llm: true
-plugins:
- models:
- - "provider/openai_api_compatible.yaml"
-meta:
- version: 0.0.1
- arch:
- - "amd64"
- - "arm64"
- runner:
- language: "python"
- version: "3.12"
- entrypoint: "main"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/common_openai.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/common_openai.py
deleted file mode 100644
index 282828eb98..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/common_openai.py
+++ /dev/null
@@ -1,53 +0,0 @@
-from collections.abc import Mapping
-
-import openai
-from httpx import Timeout
-
-from dify_plugin.errors.model import InvokeAuthorizationError, InvokeBadRequestError, InvokeConnectionError, InvokeError, InvokeRateLimitError, InvokeServerUnavailableError
-
-
-class _CommonOpenAI:
- def _to_credential_kwargs(self, credentials: Mapping) -> dict:
- """
- Transform credentials to kwargs for model instance
-
- :param credentials:
- :return:
- """
- credentials_kwargs = {
- "api_key": credentials['openai_api_key'],
- "timeout": Timeout(315.0, read=300.0, write=10.0, connect=5.0),
- "max_retries": 1,
- }
-
- if credentials.get("openai_api_base"):
- openai_api_base = credentials["openai_api_base"].rstrip("/")
- credentials_kwargs["base_url"] = openai_api_base + "/v1"
-
- if 'openai_organization' in credentials:
- credentials_kwargs['organization'] = credentials['openai_organization']
-
- return credentials_kwargs
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeConnectionError: [openai.APIConnectionError, openai.APITimeoutError],
- InvokeServerUnavailableError: [openai.InternalServerError],
- InvokeRateLimitError: [openai.RateLimitError],
- InvokeAuthorizationError: [openai.AuthenticationError, openai.PermissionDeniedError],
- InvokeBadRequestError: [
- openai.BadRequestError,
- openai.NotFoundError,
- openai.UnprocessableEntityError,
- openai.APIError,
- ],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/llm/llm.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/llm/llm.py
deleted file mode 100644
index b3e2755866..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/llm/llm.py
+++ /dev/null
@@ -1,31 +0,0 @@
-from typing import Mapping
-
-from dify_plugin.entities.model import (
- AIModelEntity,
- I18nObject,
- ModelFeature
-)
-
-from dify_plugin.interfaces.model.openai_compatible.llm import (
- OAICompatLargeLanguageModel,
-)
-
-
-class OpenAILargeLanguageModel(OAICompatLargeLanguageModel):
- def get_customizable_model_schema(self, model: str, credentials: Mapping) -> AIModelEntity:
- entity = super().get_customizable_model_schema(model, credentials)
-
- agent_though_support = credentials.get("agent_though_support", "not_supported")
- if agent_though_support == "supported":
- try:
- entity.features.index(ModelFeature.AGENT_THOUGHT)
- except ValueError:
- entity.features.append(ModelFeature.AGENT_THOUGHT)
-
- if "display_name" in credentials and credentials["display_name"] != "":
- entity.label= I18nObject(
- en_US=credentials["display_name"],
- zh_Hans=credentials["display_name"]
- )
-
- return entity
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/rerank/rerank.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/rerank/rerank.py
deleted file mode 100644
index 050b8415d2..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/rerank/rerank.py
+++ /dev/null
@@ -1,50 +0,0 @@
-from typing import Mapping
-
-from dify_plugin.entities.model import (
- AIModelEntity,
- I18nObject
-)
-
-from dify_plugin.interfaces.model.openai_compatible.rerank import (
- OAICompatRerankModel,
-)
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
-)
-
-class OpenAIRerankModel(OAICompatRerankModel):
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- self._invoke(
- model=model,
- credentials=credentials,
- query="What is the capital of the United States?",
- docs=[
- "Carson City is the capital city of the American state of Nevada. At the 2010 United States "
- "Census, Carson City had a population of 55,274.",
- "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that "
- "are a political division controlled by the United States. Its capital is Saipan.",
- ],
- score_threshold=0.8,
- top_n=3,
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex)) from ex
-
- def get_customizable_model_schema(self, model: str, credentials: Mapping) -> AIModelEntity:
- entity = super().get_customizable_model_schema(model, credentials)
-
- if "display_name" in credentials and credentials["display_name"] != "":
- entity.label= I18nObject(
- en_US=credentials["display_name"],
- zh_Hans=credentials["display_name"]
- )
-
- return entity
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/speech2text/speech2text.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/speech2text/speech2text.py
deleted file mode 100644
index 0dc949dfab..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/speech2text/speech2text.py
+++ /dev/null
@@ -1,28 +0,0 @@
-from typing import Optional
-from dify_plugin.entities.model import AIModelEntity, FetchFrom, I18nObject, ModelType
-from dify_plugin.interfaces.model.openai_compatible.speech2text import (
- OAICompatSpeech2TextModel,
-)
-
-
-class OpenAISpeech2TextModel(OAICompatSpeech2TextModel):
- def get_customizable_model_schema(self, model: str, credentials: dict) -> Optional[AIModelEntity]:
- """
- used to define customizable model schema
- """
- entity = AIModelEntity(
- model=model,
- label=I18nObject(en_US=model),
- fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
- model_type=ModelType.SPEECH2TEXT,
- model_properties={},
- parameter_rules=[],
- )
-
- if "display_name" in credentials and credentials["display_name"] != "":
- entity.label= I18nObject(
- en_US=credentials["display_name"],
- zh_Hans=credentials["display_name"]
- )
-
- return entity
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/text_embedding/text_embedding.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/text_embedding/text_embedding.py
deleted file mode 100644
index d3fd211b40..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/text_embedding/text_embedding.py
+++ /dev/null
@@ -1,24 +0,0 @@
-from typing import Mapping
-
-from dify_plugin.entities.model import (
- AIModelEntity,
- I18nObject
-)
-
-from dify_plugin.interfaces.model.openai_compatible.text_embedding import (
- OAICompatEmbeddingModel,
-)
-
-
-class OpenAITextEmbeddingModel(OAICompatEmbeddingModel):
-
- def get_customizable_model_schema(self, model: str, credentials: Mapping) -> AIModelEntity:
- entity = super().get_customizable_model_schema(model, credentials)
-
- if "display_name" in credentials and credentials["display_name"] != "":
- entity.label= I18nObject(
- en_US=credentials["display_name"],
- zh_Hans=credentials["display_name"]
- )
-
- return entity
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/tts/tts.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/tts/tts.py
deleted file mode 100644
index 2201dff8a5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/models/tts/tts.py
+++ /dev/null
@@ -1,22 +0,0 @@
-from typing import Mapping
-
-from dify_plugin.entities.model import (
- AIModelEntity,
- I18nObject
-)
-
-from dify_plugin.interfaces.model.openai_compatible.tts import OAICompatText2SpeechModel
-
-
-class OpenAIText2SpeechModel(OAICompatText2SpeechModel):
-
- def get_customizable_model_schema(self, model: str, credentials: Mapping) -> AIModelEntity:
- entity = super().get_customizable_model_schema(model, credentials)
-
- if "display_name" in credentials and credentials["display_name"] != "":
- entity.label= I18nObject(
- en_US=credentials["display_name"],
- zh_Hans=credentials["display_name"]
- )
-
- return entity
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.py b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.py
deleted file mode 100644
index 57e28ffbc2..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.py
+++ /dev/null
@@ -1,17 +0,0 @@
-import logging
-from collections.abc import Mapping
-
-from dify_plugin import ModelProvider
-
-logger = logging.getLogger(__name__)
-
-
-class OpenAIProvider(ModelProvider):
- def validate_provider_credentials(self, credentials: Mapping) -> None:
- """
- Validate provider credentials
- if validate failed, raise exception
-
- :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
- """
- pass
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.yaml b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.yaml
deleted file mode 100644
index 193ce61976..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/provider/openai_api_compatible.yaml
+++ /dev/null
@@ -1,240 +0,0 @@
-provider: openai_api_compatible
-label:
- en_US: OpenAI-API-compatible
-description:
- en_US: Model providers compatible with OpenAI's API standard, such as LM Studio.
- zh_Hans: 兼容 OpenAI API 的模型供应商,例如 LM Studio 。
-icon_small:
- en_US: icon.svg
-supported_model_types:
- - llm
- - rerank
- - text-embedding
- - speech2text
- - tts
-configurate_methods:
- - customizable-model
-model_credential_schema:
- model:
- label:
- en_US: Model Name
- zh_Hans: 模型名称
- placeholder:
- en_US: Enter full model name
- zh_Hans: 输入模型全称
- credential_form_schemas:
- - variable: display_name
- label:
- en_US: Model display name
- zh_Hans: 模型显示名称
- type: text-input
- required: false
- placeholder:
- zh_Hans: 模型在界面的显示名称
- en_US: The display name of the model in the interface.
- - variable: api_key
- label:
- en_US: API Key
- type: secret-input
- required: false
- placeholder:
- zh_Hans: 在此输入您的 API Key
- en_US: Enter your API Key
- - variable: endpoint_url
- label:
- zh_Hans: API endpoint URL
- en_US: API endpoint URL
- type: text-input
- required: true
- placeholder:
- zh_Hans: Base URL, e.g. https://api.openai.com/v1
- en_US: Base URL, e.g. https://api.openai.com/v1
- - variable: endpoint_model_name
- label:
- zh_Hans: API endpoint中的模型名称
- en_US: model name for API endpoint
- type: text-input
- required: false
- placeholder:
- zh_Hans: endpoint model name, e.g. chatgpt4.0
- en_US: endpoint model name, e.g. chatgpt4.0
- - variable: mode
- show_on:
- - variable: __model_type
- value: llm
- label:
- en_US: Completion mode
- type: select
- required: false
- default: chat
- placeholder:
- zh_Hans: 选择对话类型
- en_US: Select completion mode
- options:
- - value: completion
- label:
- en_US: Completion
- zh_Hans: 补全
- - value: chat
- label:
- en_US: Chat
- zh_Hans: 对话
- - variable: context_size
- label:
- zh_Hans: 模型上下文长度
- en_US: Model context size
- required: true
- show_on:
- - variable: __model_type
- value: llm
- type: text-input
- default: "4096"
- placeholder:
- zh_Hans: 在此输入您的模型上下文长度
- en_US: Enter your Model context size
- - variable: context_size
- label:
- zh_Hans: 模型上下文长度
- en_US: Model context size
- required: true
- show_on:
- - variable: __model_type
- value: text-embedding
- type: text-input
- default: "4096"
- placeholder:
- zh_Hans: 在此输入您的模型上下文长度
- en_US: Enter your Model context size
- - variable: context_size
- label:
- zh_Hans: 模型上下文长度
- en_US: Model context size
- required: true
- show_on:
- - variable: __model_type
- value: rerank
- type: text-input
- default: "4096"
- placeholder:
- zh_Hans: 在此输入您的模型上下文长度
- en_US: Enter your Model context size
- - variable: max_tokens_to_sample
- label:
- zh_Hans: 最大 token 上限
- en_US: Upper bound for max tokens
- show_on:
- - variable: __model_type
- value: llm
- default: "4096"
- type: text-input
- - variable: agent_though_support
- show_on:
- - variable: __model_type
- value: llm
- label:
- en_US: Agent Thought
- type: select
- required: false
- default: not_supported
- options:
- - value: supported
- label:
- en_US: Support
- zh_Hans: 支持
- - value: not_supported
- label:
- en_US: Not Support
- zh_Hans: 不支持
- - variable: function_calling_type
- show_on:
- - variable: __model_type
- value: llm
- label:
- en_US: Function calling
- type: select
- required: false
- default: no_call
- options:
- - value: function_call
- label:
- en_US: Function Call
- zh_Hans: Function Call
- - value: tool_call
- label:
- en_US: Tool Call
- zh_Hans: Tool Call
- - value: no_call
- label:
- en_US: Not Support
- zh_Hans: 不支持
- - variable: stream_function_calling
- show_on:
- - variable: __model_type
- value: llm
- label:
- en_US: Stream function calling
- type: select
- required: false
- default: not_supported
- options:
- - value: supported
- label:
- en_US: Support
- zh_Hans: 支持
- - value: not_supported
- label:
- en_US: Not Support
- zh_Hans: 不支持
- - variable: vision_support
- show_on:
- - variable: __model_type
- value: llm
- label:
- zh_Hans: Vision 支持
- en_US: Vision Support
- type: select
- required: false
- default: no_support
- options:
- - value: support
- label:
- en_US: Support
- zh_Hans: 支持
- - value: no_support
- label:
- en_US: Not Support
- zh_Hans: 不支持
- - variable: stream_mode_delimiter
- label:
- zh_Hans: 流模式返回结果的分隔符
- en_US: Delimiter for streaming results
- show_on:
- - variable: __model_type
- value: llm
- default: '\n\n'
- type: text-input
- - variable: voices
- show_on:
- - variable: __model_type
- value: tts
- label:
- en_US: Available Voices (comma-separated)
- zh_Hans: 可用声音(用英文逗号分隔)
- type: text-input
- required: false
- default: "alloy"
- placeholder:
- en_US: "alloy,echo,fable,onyx,nova,shimmer"
- zh_Hans: "alloy,echo,fable,onyx,nova,shimmer"
- help:
- en_US: "List voice names separated by commas. First voice will be used as default."
- zh_Hans: "用英文逗号分隔的声音列表。第一个声音将作为默认值。"
-extra:
- python:
- provider_source: provider/openai_api_compatible.py
- model_sources:
- - "models/llm/llm.py"
- - "models/text_embedding/text_embedding.py"
- - "models/rerank/rerank.py"
- - "models/speech2text/speech2text.py"
- - "models/tts/tts.py"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/requirements.txt
deleted file mode 100644
index dd23658227..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/openai_api_compatible-0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7/requirements.txt
+++ /dev/null
@@ -1,2 +0,0 @@
-dify_plugin==0.0.1b73
-openai~=1.66.3
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/.env.example b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/.env.example
deleted file mode 100644
index dbb75b858b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/.env.example
+++ /dev/null
@@ -1,4 +0,0 @@
-INSTALL_METHOD=remote
-REMOTE_INSTALL_HOST=debug-plugin.dify.dev
-REMOTE_INSTALL_PORT=5003
-REMOTE_INSTALL_KEY=********-****-****-****-************
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/README.md b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/README.md
deleted file mode 100644
index a27b2c9121..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/README.md
+++ /dev/null
@@ -1,15 +0,0 @@
-## Overview
-
-SiliconCloud (MaaS) simplifies AI model deployment with robust performance. This plugin provides access to various models (LLMs, text embedding, reranking, STT, TTS), configurable via model name, API key, and other parameters.
-
-## Configure
-
-Install the SiliconFlow plugin, then configure it by entering your API Key. Get your API Key from [SiliconFlow](https://cloud.siliconflow.cn/account/ak) and save.
-
-
-
-## About SiliconFlow
-
-SiliconFlow is committed to building a scalable, standardized, and high-performance AI Infra platform. It offers SiliconCloud (the model cloud service platform), SiliconLLM (the LLM inference engine), and OneDiff (the high-performance text-to-image/video acceleration library). These solutions help enterprises and individual users deploy AI models efficiently and cost-effectively.
-
-[Website](https://siliconflow.cn/) | [SiliconCloud Quick Start](https://docs.siliconflow.cn/quickstart)
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow-01.png b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow-01.png
deleted file mode 100644
index d930db0b39..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow-01.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow.svg b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow.svg
deleted file mode 100644
index 16e406f030..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow_square.svg b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow_square.svg
deleted file mode 100644
index ad6b384f7a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/_assets/siliconflow_square.svg
+++ /dev/null
@@ -1 +0,0 @@
-
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/main.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/main.py
deleted file mode 100644
index f2bfcdfc0e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/main.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from dify_plugin import Plugin, DifyPluginEnv
-
-plugin = Plugin(DifyPluginEnv())
-
-if __name__ == '__main__':
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/manifest.yaml
deleted file mode 100644
index 4262fe5aa5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/manifest.yaml
+++ /dev/null
@@ -1,29 +0,0 @@
-meta:
- arch:
- - amd64
- - arm64
- runner:
- entrypoint: main
- language: python
- version: "3.12"
- version: 0.0.1
-name: siliconflow
-author: langgenius
-label:
- en_US: SiliconFlow
- zh_Hans: 硅基流动
-description:
- en_US: SiliconFlow provides access to various models (LLMs, text embedding, reranking, STT, TTS), configurable via model name, API key, and other parameters.
- zh_Hans: 硅基流动提供对各种模型(LLM、文本嵌入、重排序、STT、TTS)的访问,可通过模型名称、API密钥和其他参数进行配置。
-icon: siliconflow_square.svg
-plugins:
- models:
- - provider/siliconflow.yaml
-resource:
- memory: 268435456
- permission:
- model:
- enabled: false
-type: plugin
-version: 0.0.8
-created_at: 2024-09-20T00:13:50.29298939-04:00
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-26b.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-26b.yaml
deleted file mode 100644
index f7b03e1254..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-26b.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: OpenGVLab/InternVL2-26B
-label:
- en_US: OpenGVLab/InternVL2-26B
-model_type: llm
-features:
- - vision
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '21'
- output: '21'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-8b.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-8b.yaml
deleted file mode 100644
index 1e858bb4be..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/Internvl2-8b.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: Pro/OpenGVLab/InternVL2-8B
-label:
- en_US: Pro/OpenGVLab/InternVL2-8B
-model_type: llm
-features:
- - vision
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '21'
- output: '21'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/_position.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/_position.yaml
deleted file mode 100644
index ffa16f8bb4..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/_position.yaml
+++ /dev/null
@@ -1,44 +0,0 @@
-- Pro/deepseek-ai/DeepSeek-R1
-- Pro/deepseek-ai/DeepSeek-V3
-- deepseek-ai/DeepSeek-R1
-- deepseek-ai/DeepSeek-V3
-- deepseek-ai/DeepSeek-V2.5
-- deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
-- deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
-- deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
-- deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
-- deepseek-ai/DeepSeek-R1-Distill-Llama-70B
-- deepseek-ai/DeepSeek-R1-Distill-Llama-8B
-- deepseek-ai/DeepSeek-V2.5
-- deepseek-ai/Janus-Pro-7B
-- Qwen/QwQ-32B-Preview
-- Qwen/QVQ-72B-Preview
-- Qwen/Qwen2.5-72B-Instruct
-- Qwen/Qwen2.5-72B-Instruct-128K
-- Qwen/Qwen2.5-32B-Instruct
-- Qwen/Qwen2.5-14B-Instruct
-- Qwen/Qwen2.5-7B-Instruct
-- Qwen/Qwen2.5-Coder-32B-Instruct
-- Qwen/Qwen2.5-Coder-7B-Instruct
-- Qwen/Qwen2-VL-72B-Instruct
-- Qwen/Qwen2-1.5B-Instruct
-- Qwen/Qwen2.5-72B-Instruct-128K
-- Vendor-A/Qwen/Qwen2.5-72B-Instruct
-- Pro/Qwen/Qwen2-VL-7B-Instruct
-- OpenGVLab/InternVL2-26B
-- Pro/OpenGVLab/InternVL2-8B
-- Vendor-A/Qwen/Qwen2.5-72B-Instruct
-- Pro/Qwen/Qwen2-VL-7B-Instruct
-- Pro/OpenGVLab/InternVL2-8B
-- OpenGVLab/InternVL2-26B
-- THUDM/glm-4-9b-chat
-- 01-ai/Yi-1.5-34B-Chat-16K
-- 01-ai/Yi-1.5-9B-Chat-16K
-- 01-ai/Yi-1.5-6B-Chat
-- internlm/internlm2_5-20b-chat
-- internlm/internlm2_5-7b-chat
-- meta-llama/Llama-3.3-70B-Instruct
-- meta-llama/Meta-Llama-3.1-70B-Instruct
-- meta-llama/Meta-Llama-3.1-8B-Instruct
-- google/gemma-2-27b-it
-- google/gemma-2-9b-it
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepdeek-coder-v2-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepdeek-coder-v2-instruct.yaml
deleted file mode 100644
index b13a2a751c..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepdeek-coder-v2-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: deepseek-ai/DeepSeek-Coder-V2-Instruct
-label:
- en_US: deepseek-ai/DeepSeek-Coder-V2-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '1.33'
- output: '1.33'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-70B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-70B.yaml
deleted file mode 100644
index 59e0b4d68e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-70B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Llama-70B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Llama-70B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Llama-70B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "4.3"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-8B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-8B.yaml
deleted file mode 100644
index f3256aa5a0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-llama-8B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "0.00"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-1.5B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-1.5B.yaml
deleted file mode 100644
index 7297278654..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-1.5B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "1.26"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-14B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-14B.yaml
deleted file mode 100644
index 24b5c89ebf..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-14B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "0.70"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-32B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-32B.yaml
deleted file mode 100644
index 2a8cce1f96..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-32B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "1.26"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-7B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-7B.yaml
deleted file mode 100644
index cde1c14aae..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-distill-qwen-7B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
- en_US: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "0.00"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-pro.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-pro.yaml
deleted file mode 100644
index d9d34ab2a1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1-pro.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: Pro/deepseek-ai/DeepSeek-R1
-label:
- zh_Hans: Pro/deepseek-ai/DeepSeek-R1
- en_US: Pro/deepseek-ai/DeepSeek-R1
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 16384
- default: 16384
-pricing:
- input: "4"
- output: "16"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1.yaml
deleted file mode 100644
index 1c382f26ea..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-r1.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-ai/DeepSeek-R1
-label:
- zh_Hans: deepseek-ai/DeepSeek-R1
- en_US: deepseek-ai/DeepSeek-R1
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 16384
- default: 16384
-pricing:
- input: "4"
- output: "16"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2-chat.yaml
deleted file mode 100644
index 00bdb0ddf5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2-chat.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: deepseek-ai/DeepSeek-V2-Chat
-label:
- en_US: deepseek-ai/DeepSeek-V2-Chat
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '1.33'
- output: '1.33'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2.5.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2.5.yaml
deleted file mode 100644
index 511cc1df9f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v2.5.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-model: deepseek-ai/DeepSeek-V2.5
-label:
- en_US: deepseek-ai/DeepSeek-V2.5
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.33'
- output: '1.33'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3-pro.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3-pro.yaml
deleted file mode 100644
index 3d37734045..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3-pro.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-model: Pro/deepseek-ai/DeepSeek-V3
-label:
- en_US: Pro/deepseek-ai/DeepSeek-V3
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: "1"
- output: "2"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3.yaml
deleted file mode 100644
index ed1a5f0099..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/deepseek-v3.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-model: deepseek-ai/DeepSeek-V3
-label:
- en_US: deepseek-ai/DeepSeek-V3
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: "1"
- output: "2"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-27b-it.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-27b-it.yaml
deleted file mode 100644
index 7fd7adb753..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-27b-it.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: google/gemma-2-27b-it
-label:
- en_US: google/gemma-2-27b-it
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8196
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-9b-it.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-9b-it.yaml
deleted file mode 100644
index ab548e4409..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/gemma-2-9b-it.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: google/gemma-2-9b-it
-label:
- en_US: google/gemma-2-9b-it
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8196
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/glm4-9b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/glm4-9b-chat.yaml
deleted file mode 100644
index 43c5b344a0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/glm4-9b-chat.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: THUDM/glm-4-9b-chat
-label:
- en_US: THUDM/glm-4-9b-chat
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/hunyuan-a52b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/hunyuan-a52b-instruct.yaml
deleted file mode 100644
index 51d6c024ff..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/hunyuan-a52b-instruct.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-model: Tencent/Hunyuan-A52B-Instruct
-label:
- en_US: Tencent/Hunyuan-A52B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '21'
- output: '21'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-20b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-20b-chat.yaml
deleted file mode 100644
index a5ae3674c9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-20b-chat.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: internlm/internlm2_5-20b-chat
-label:
- en_US: internlm/internlm2_5-20b-chat
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1'
- output: '1'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-7b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-7b-chat.yaml
deleted file mode 100644
index dec856ed2e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internlm2_5-7b-chat.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: internlm/internlm2_5-7b-chat
-label:
- en_US: internlm/internlm2_5-7b-chat
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internvl2-llama3-76b.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internvl2-llama3-76b.yaml
deleted file mode 100644
index b5443df18c..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/internvl2-llama3-76b.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-model: OpenGVLab/InternVL2-Llama3-76B
-label:
- en_US: OpenGVLab/InternVL2-Llama3-76B
-model_type: llm
-features:
- - vision
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '21'
- output: '21'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/janus-pro-7B.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/janus-pro-7B.yaml
deleted file mode 100644
index dabbd745e5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/janus-pro-7B.yaml
+++ /dev/null
@@ -1,22 +0,0 @@
-model: deepseek-ai/Janus-Pro-7B
-label:
- zh_Hans: deepseek-ai/Janus-Pro-7B
- en_US: deepseek-ai/Janus-Pro-7B
-model_type: llm
-features:
- - agent-thought
- - vision
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.00"
- output: "0.00"
- unit: "0.000001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/llm.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/llm.py
deleted file mode 100644
index b26f30de1e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/llm.py
+++ /dev/null
@@ -1,90 +0,0 @@
-from collections.abc import Generator
-from typing import Optional, Union
-from dify_plugin import OAICompatLargeLanguageModel
-from dify_plugin.entities.model import (
- AIModelEntity,
- FetchFrom,
- I18nObject,
- ModelFeature,
- ModelPropertyKey,
- ModelType,
- ParameterRule,
- ParameterType,
-)
-from dify_plugin.entities.model.llm import LLMMode, LLMResult
-from dify_plugin.entities.model.message import PromptMessage, PromptMessageTool
-
-
-class SiliconflowLargeLanguageModel(OAICompatLargeLanguageModel):
- def _invoke(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- self._add_custom_parameters(credentials)
- return super()._invoke(model, credentials, prompt_messages, model_parameters, tools, stop, stream)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- self._add_custom_parameters(credentials)
- super().validate_credentials(model, credentials)
-
- @classmethod
- def _add_custom_parameters(cls, credentials: dict) -> None:
- credentials["mode"] = "chat"
- credentials["endpoint_url"] = "https://api.siliconflow.cn/v1"
-
- def get_customizable_model_schema(self, model: str, credentials: dict) -> Optional[AIModelEntity]:
- return AIModelEntity(
- model=model,
- label=I18nObject(en_US=model, zh_Hans=model),
- model_type=ModelType.LLM,
- features=[ModelFeature.TOOL_CALL, ModelFeature.MULTI_TOOL_CALL, ModelFeature.STREAM_TOOL_CALL]
- if credentials.get("function_calling_type") == "tool_call"
- else [],
- fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
- model_properties={
- ModelPropertyKey.CONTEXT_SIZE: int(credentials.get("context_size", 8000)),
- ModelPropertyKey.MODE: LLMMode.CHAT.value,
- },
- parameter_rules=[
- ParameterRule(
- name="temperature",
- use_template="temperature",
- label=I18nObject(en_US="Temperature", zh_Hans="温度"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="max_tokens",
- use_template="max_tokens",
- default=4096,
- min=1,
- max=int(credentials.get("max_tokens", 16384)),
- label=I18nObject(en_US="Max Tokens", zh_Hans="最大标记"),
- type=ParameterType.INT,
- ),
- ParameterRule(
- name="top_p",
- use_template="top_p",
- label=I18nObject(en_US="Top P", zh_Hans="Top P"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="top_k",
- use_template="top_k",
- label=I18nObject(en_US="Top K", zh_Hans="Top K"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="frequency_penalty",
- use_template="frequency_penalty",
- label=I18nObject(en_US="Frequency Penalty", zh_Hans="重复惩罚"),
- type=ParameterType.FLOAT,
- ),
- ],
- )
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-llama-3.3-70b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-llama-3.3-70b-instruct.yaml
deleted file mode 100644
index 9373a8f4ca..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-llama-3.3-70b-instruct.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-model: meta-llama/Llama-3.3-70B-Instruct
-label:
- en_US: meta-llama/Llama-3.3-70B-Instruct
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-70b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-70b-instruct.yaml
deleted file mode 100644
index 9825090759..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-70b-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: meta-llama/Meta-Llama-3-70B-Instruct
-label:
- en_US: meta-llama/Meta-Llama-3-70B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-8b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-8b-instruct.yaml
deleted file mode 100644
index 0133fd15d4..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3-8b-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: meta-llama/Meta-Llama-3-8B-Instruct
-label:
- en_US: meta-llama/Meta-Llama-3-8B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-405b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-405b-instruct.yaml
deleted file mode 100644
index ceebbac515..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-405b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: meta-llama/Meta-Llama-3.1-405B-Instruct
-label:
- en_US: meta-llama/Meta-Llama-3.1-405B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '21'
- output: '21'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-70b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-70b-instruct.yaml
deleted file mode 100644
index f1fbb74cbd..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-70b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: meta-llama/Meta-Llama-3.1-70B-Instruct
-label:
- en_US: meta-llama/Meta-Llama-3.1-70B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-8b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-8b-instruct.yaml
deleted file mode 100644
index a9a43545e8..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/meta-mlama-3.1-8b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: meta-llama/Meta-Llama-3.1-8B-Instruct
-label:
- en_US: meta-llama/Meta-Llama-3.1-8B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-7b-instruct-v0.2.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-7b-instruct-v0.2.yaml
deleted file mode 100644
index a71d8688a8..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-7b-instruct-v0.2.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: mistralai/Mistral-7B-Instruct-v0.2
-label:
- en_US: mistralai/Mistral-7B-Instruct-v0.2
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-8x7b-instruct-v0.1.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-8x7b-instruct-v0.1.yaml
deleted file mode 100644
index db45a75c6d..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/mistral-8x7b-instruct-v0.1.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: mistralai/Mixtral-8x7B-Instruct-v0.1
-label:
- en_US: mistralai/Mixtral-8x7B-Instruct-v0.1
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qvq-72B-preview.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qvq-72B-preview.yaml
deleted file mode 100644
index dada6bb803..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qvq-72B-preview.yaml
+++ /dev/null
@@ -1,54 +0,0 @@
-model: Qwen/QVQ-72B-Preview
-label:
- en_US: Qwen/QVQ-72B-Preview
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
- - vision
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 16384
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '9.90'
- output: '9.90'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qwq-32B-preview.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qwq-32B-preview.yaml
deleted file mode 100644
index e73c5d2030..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen-qwq-32B-preview.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-model: Qwen/QwQ-32B-Preview
-label:
- en_US: Qwen/QwQ-32B-Preview
-model_type: llm
-features:
- - agent-thought
- - tool-call
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-1.5b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-1.5b-instruct.yaml
deleted file mode 100644
index bec5d37c57..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-1.5b-instruct.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-model: Qwen/Qwen2-1.5B-Instruct
-label:
- en_US: Qwen/Qwen2-1.5B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-57b-a14b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-57b-a14b-instruct.yaml
deleted file mode 100644
index 0f56d16d9b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-57b-a14b-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: Qwen/Qwen2-57B-A14B-Instruct
-label:
- en_US: Qwen/Qwen2-57B-A14B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-72b-instruct.yaml
deleted file mode 100644
index af65cfb8ed..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-72b-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: Qwen/Qwen2-72B-Instruct
-label:
- en_US: Qwen/Qwen2-72B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-7b-instruct.yaml
deleted file mode 100644
index f0f10ae625..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-7b-instruct.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-model: Qwen/Qwen2-7B-Instruct
-label:
- en_US: Qwen/Qwen2-7B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-72b-instruct.yaml
deleted file mode 100644
index f5180b41f1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-72b-instruct.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: Qwen/Qwen2-VL-72B-Instruct
-label:
- en_US: Qwen/Qwen2-VL-72B-Instruct
-model_type: llm
-features:
- - vision
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-7b-Instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-7b-Instruct.yaml
deleted file mode 100644
index 0ffbaee383..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2-vl-7b-Instruct.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: Pro/Qwen/Qwen2-VL-7B-Instruct
-label:
- en_US: Pro/Qwen/Qwen2-VL-7B-Instruct
-model_type: llm
-features:
- - vision
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0.35'
- output: '0.35'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-14b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-14b-instruct.yaml
deleted file mode 100644
index 8a045b818a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-14b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Qwen/Qwen2.5-14B-Instruct
-label:
- en_US: Qwen/Qwen2.5-14B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 8192
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0.7'
- output: '0.7'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-32b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-32b-instruct.yaml
deleted file mode 100644
index 9c308d2ab4..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-32b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Qwen/Qwen2.5-32B-Instruct
-label:
- en_US: Qwen/Qwen2.5-32B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 8192
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-128k.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-128k.yaml
deleted file mode 100644
index 79f94da376..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-128k.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Qwen/Qwen2.5-72B-Instruct-128K
-label:
- en_US: Qwen/Qwen2.5-72B-Instruct-128K
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-vendorA.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-vendorA.yaml
deleted file mode 100644
index fdbe38ff21..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct-vendorA.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Vendor-A/Qwen/Qwen2.5-72B-Instruct
-label:
- en_US: Vendor-A/Qwen/Qwen2.5-72B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.00'
- output: '1.00'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct.yaml
deleted file mode 100644
index de9d9d97bf..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-72b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Qwen/Qwen2.5-72B-Instruct
-label:
- en_US: Qwen/Qwen2.5-72B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-7b-instruct.yaml
deleted file mode 100644
index bb85dbe948..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-7b-instruct.yaml
+++ /dev/null
@@ -1,51 +0,0 @@
-model: Qwen/Qwen2.5-7B-Instruct
-label:
- en_US: Qwen/Qwen2.5-7B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 8192
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-32b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-32b-instruct.yaml
deleted file mode 100644
index de2224a67b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-32b-instruct.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: Qwen/Qwen2.5-Coder-32B-Instruct
-label:
- en_US: Qwen/Qwen2.5-Coder-32B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-7b-instruct.yaml
deleted file mode 100644
index c31a338cdd..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-coder-7b-instruct.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-model: Qwen/Qwen2.5-Coder-7B-Instruct
-label:
- en_US: Qwen/Qwen2.5-Coder-7B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-math-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-math-72b-instruct.yaml
deleted file mode 100644
index 40c9ab48ca..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/qwen2.5-math-72b-instruct.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-model: Qwen/Qwen2.5-Math-72B-Instruct
-label:
- en_US: Qwen/Qwen2.5-Math-72B-Instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: '4.13'
- output: '4.13'
- unit: '0.000001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-34b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-34b-chat.yaml
deleted file mode 100644
index 3e25f82369..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-34b-chat.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-model: 01-ai/Yi-1.5-34B-Chat
-label:
- en_US: 01-ai/Yi-1.5-34B-Chat-16K
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 16384
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '1.26'
- output: '1.26'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-6b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-6b-chat.yaml
deleted file mode 100644
index 827b2ce1e5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-6b-chat.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-model: 01-ai/Yi-1.5-6B-Chat
-label:
- en_US: 01-ai/Yi-1.5-6B-Chat
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-9b-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-9b-chat.yaml
deleted file mode 100644
index 112fcbfe97..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/llm/yi-1.5-9b-chat.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-model: 01-ai/Yi-1.5-9B-Chat-16K
-label:
- en_US: 01-ai/Yi-1.5-9B-Chat-16K
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 16384
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
-pricing:
- input: '0'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bce-reranker-base_v1.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bce-reranker-base_v1.yaml
deleted file mode 100644
index ff3635bfeb..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bce-reranker-base_v1.yaml
+++ /dev/null
@@ -1,4 +0,0 @@
-model: netease-youdao/bce-reranker-base_v1
-model_type: rerank
-model_properties:
- context_size: 512
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bge-reranker-v2-m3.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bge-reranker-v2-m3.yaml
deleted file mode 100644
index 807f531b08..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/bge-reranker-v2-m3.yaml
+++ /dev/null
@@ -1,4 +0,0 @@
-model: BAAI/bge-reranker-v2-m3
-model_type: rerank
-model_properties:
- context_size: 8192
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/rerank.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/rerank.py
deleted file mode 100644
index 2587dc2242..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/rerank/rerank.py
+++ /dev/null
@@ -1,76 +0,0 @@
-from typing import Optional
-import httpx
-from dify_plugin.entities.model.rerank import RerankDocument, RerankResult
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-from dify_plugin.interfaces.model.rerank_model import RerankModel
-
-
-class SiliconflowRerankModel(RerankModel):
- def _invoke(
- self,
- model: str,
- credentials: dict,
- query: str,
- docs: list[str],
- score_threshold: Optional[float] = None,
- top_n: Optional[int] = None,
- user: Optional[str] = None,
- ) -> RerankResult:
- if len(docs) == 0:
- return RerankResult(model=model, docs=[])
- base_url = credentials.get("base_url", "https://api.siliconflow.cn/v1")
- base_url = base_url.removesuffix("/")
- try:
- response = httpx.post(
- base_url + "/rerank",
- json={"model": model, "query": query, "documents": docs, "top_n": top_n, "return_documents": True},
- headers={"Authorization": f"Bearer {credentials.get('api_key')}"},
- )
- response.raise_for_status()
- results = response.json()
- rerank_documents = []
- for result in results["results"]:
- rerank_document = RerankDocument(
- index=result["index"], text=result["document"]["text"], score=result["relevance_score"]
- )
- if score_threshold is None or result["relevance_score"] >= score_threshold:
- rerank_documents.append(rerank_document)
- return RerankResult(model=model, docs=rerank_documents)
- except httpx.HTTPStatusError as e:
- raise InvokeServerUnavailableError(str(e))
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- try:
- self._invoke(
- model=model,
- credentials=credentials,
- query="What is the capital of the United States?",
- docs=[
- "Carson City is the capital city of the American state of Nevada. At the 2010 United States Census, Carson City had a population of 55,274.",
- "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that are a political division controlled by the United States. Its capital is Saipan.",
- ],
- score_threshold=0.8,
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex))
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- """
- return {
- InvokeConnectionError: [httpx.ConnectError],
- InvokeServerUnavailableError: [httpx.RemoteProtocolError],
- InvokeRateLimitError: [],
- InvokeAuthorizationError: [httpx.HTTPStatusError],
- InvokeBadRequestError: [httpx.RequestError],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/funaudio-sense-voice-small.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/funaudio-sense-voice-small.yaml
deleted file mode 100644
index d4bc33c68e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/funaudio-sense-voice-small.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-model: FunAudioLLM/SenseVoiceSmall
-model_type: speech2text
-model_properties:
- file_upload_limit: 1
- supported_file_extensions: mp3,wav
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/sense-voice-small.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/sense-voice-small.yaml
deleted file mode 100644
index 455b2ad467..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/sense-voice-small.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-model: iic/SenseVoiceSmall
-model_type: speech2text
-model_properties:
- file_upload_limit: 1
- supported_file_extensions: mp3,wav
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/speech2text.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/speech2text.py
deleted file mode 100644
index f5b2f3447f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/speech2text/speech2text.py
+++ /dev/null
@@ -1,29 +0,0 @@
-from typing import IO, Optional
-from dify_plugin import OAICompatSpeech2TextModel
-
-
-class SiliconflowSpeech2TextModel(OAICompatSpeech2TextModel):
- """
- Model class for Siliconflow Speech to text model.
- """
-
- def _invoke(self, model: str, credentials: dict, file: IO[bytes], user: Optional[str] = None) -> str:
- """
- Invoke speech2text model
-
- :param model: model name
- :param credentials: model credentials
- :param file: audio file
- :param user: unique user id
- :return: text for given audio file
- """
- self._add_custom_parameters(credentials)
- return super()._invoke(model, credentials, file)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- self._add_custom_parameters(credentials)
- return super().validate_credentials(model, credentials)
-
- @classmethod
- def _add_custom_parameters(cls, credentials: dict) -> None:
- credentials["endpoint_url"] = "https://api.siliconflow.cn/v1"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bce-embedding-base-v1.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bce-embedding-base-v1.yaml
deleted file mode 100644
index 710fbc04f6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bce-embedding-base-v1.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-model: netease-youdao/bce-embedding-base_v1
-model_type: text-embedding
-model_properties:
- context_size: 512
- max_chunks: 1
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-en-v1.5.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-en-v1.5.yaml
deleted file mode 100644
index 84f69b41a0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-en-v1.5.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-model: BAAI/bge-large-en-v1.5
-model_type: text-embedding
-model_properties:
- context_size: 512
- max_chunks: 1
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-zh-v1.5.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-zh-v1.5.yaml
deleted file mode 100644
index 5248375d0b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-large-zh-v1.5.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-model: BAAI/bge-large-zh-v1.5
-model_type: text-embedding
-model_properties:
- context_size: 512
- max_chunks: 1
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-m3.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-m3.yaml
deleted file mode 100644
index f0b12dd420..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/bge-m3.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-model: BAAI/bge-m3
-model_type: text-embedding
-model_properties:
- context_size: 8192
- max_chunks: 1
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/text_embedding.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/text_embedding.py
deleted file mode 100644
index ab86738dae..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/text_embedding/text_embedding.py
+++ /dev/null
@@ -1,43 +0,0 @@
-from typing import Optional
-from dify_plugin import OAICompatEmbeddingModel
-from dify_plugin.entities.model import EmbeddingInputType
-from dify_plugin.entities.model.text_embedding import TextEmbeddingResult
-
-
-class SiliconflowTextEmbeddingModel(OAICompatEmbeddingModel):
- """
- Model class for Siliconflow text embedding model.
- """
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- self._add_custom_parameters(credentials)
- super().validate_credentials(model, credentials)
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- texts: list[str],
- user: Optional[str] = None,
- input_type: EmbeddingInputType = EmbeddingInputType.DOCUMENT,
- ) -> TextEmbeddingResult:
- """
- Invoke text embedding model
-
- :param model: model name
- :param credentials: model credentials
- :param texts: texts to embed
- :param user: unique user id
- :param input_type: input type
- :return: embeddings result
- """
- self._add_custom_parameters(credentials)
- return super()._invoke(model, credentials, texts, user)
-
- def get_num_tokens(self, model: str, credentials: dict, texts: list[str]) -> int:
- self._add_custom_parameters(credentials)
- return super().get_num_tokens(model, credentials, texts)
-
- @classmethod
- def _add_custom_parameters(cls, credentials: dict) -> None:
- credentials["endpoint_url"] = "https://api.siliconflow.cn/v1"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/cosyvoice2-0.5b.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/cosyvoice2-0.5b.yaml
deleted file mode 100644
index d2e02ed21b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/cosyvoice2-0.5b.yaml
+++ /dev/null
@@ -1,38 +0,0 @@
-model: FunAudioLLM/CosyVoice2-0.5B
-model_type: tts
-model_properties:
- default_voice: 'FunAudioLLM/CosyVoice2-0.5B:alex'
- voices:
- - mode: "FunAudioLLM/CosyVoice2-0.5B:alex"
- name: "Alex(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:benjamin"
- name: "Benjamin(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:charles"
- name: "Charles(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:david"
- name: "David(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:anna"
- name: "Anna(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:bella"
- name: "Bella(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:claire"
- name: "Claire(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "FunAudioLLM/CosyVoice2-0.5B:diana"
- name: "Diana(女声)"
- language: [ "zh-Hans", "en-US" ]
- audio_type: 'mp3'
- max_workers: 5
- # stream: false
-pricing:
- input: '50'
- output: '0'
- unit: '0.000001'
- currency: RMB
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.4.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.4.yaml
deleted file mode 100644
index d8af252241..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.4.yaml
+++ /dev/null
@@ -1,37 +0,0 @@
-model: fishaudio/fish-speech-1.4
-model_type: tts
-model_properties:
- default_voice: 'fishaudio/fish-speech-1.4:alex'
- voices:
- - mode: "fishaudio/fish-speech-1.4:alex"
- name: "Alex(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:benjamin"
- name: "Benjamin(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:charles"
- name: "Charles(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:david"
- name: "David(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:anna"
- name: "Anna(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:bella"
- name: "Bella(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:claire"
- name: "Claire(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.4:diana"
- name: "Diana(女声)"
- language: [ "zh-Hans", "en-US" ]
- audio_type: 'mp3'
- max_workers: 5
- # stream: false
-pricing:
- input: '105'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.5.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.5.yaml
deleted file mode 100644
index df09c19526..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/fish-speech-1.5.yaml
+++ /dev/null
@@ -1,37 +0,0 @@
-model: fishaudio/fish-speech-1.5
-model_type: tts
-model_properties:
- default_voice: 'fishaudio/fish-speech-1.5:alex'
- voices:
- - mode: "fishaudio/fish-speech-1.5:alex"
- name: "Alex(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:benjamin"
- name: "Benjamin(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:charles"
- name: "Charles(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:david"
- name: "David(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:anna"
- name: "Anna(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:bella"
- name: "Bella(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:claire"
- name: "Claire(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "fishaudio/fish-speech-1.5:diana"
- name: "Diana(女声)"
- language: [ "zh-Hans", "en-US" ]
- audio_type: 'mp3'
- max_workers: 5
- # stream: false
-pricing:
- input: '105'
- output: '0'
- unit: '0.000001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/gpt-sovits.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/gpt-sovits.yaml
deleted file mode 100644
index 66b1dc99c2..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/gpt-sovits.yaml
+++ /dev/null
@@ -1,38 +0,0 @@
-model: RVC-Boss/GPT-SoVITS
-model_type: tts
-model_properties:
- default_voice: 'RVC-Boss/GPT-SoVITS:alex'
- voices:
- - mode: "RVC-Boss/GPT-SoVITS:alex"
- name: "Alex(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:benjamin"
- name: "Benjamin(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:charles"
- name: "Charles(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:david"
- name: "David(男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:anna"
- name: "Anna(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:bella"
- name: "Bella(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:claire"
- name: "Claire(女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "RVC-Boss/GPT-SoVITS:diana"
- name: "Diana(女声)"
- language: [ "zh-Hans", "en-US" ]
- audio_type: 'mp3'
- max_workers: 5
- # stream: false
-pricing:
- input: '50'
- output: '0'
- unit: '0.000001'
- currency: RMB
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/tts.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/tts.py
deleted file mode 100644
index 3a4454b7b8..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/models/tts/tts.py
+++ /dev/null
@@ -1,142 +0,0 @@
-import concurrent.futures
-from typing import Any, Mapping, Optional
-from dify_plugin.interfaces.model.openai_compatible.common import _CommonOaiApiCompat
-from httpx import Timeout
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeBadRequestError,
-)
-from dify_plugin.interfaces.model.tts_model import TTSModel
-from openai import OpenAI
-
-
-class SiliconFlowText2SpeechModel(_CommonOaiApiCompat, TTSModel):
- """
- Model class for SiliconFlow Speech to text model.
- """
-
- def _invoke(
- self,
- model: str,
- tenant_id: str,
- credentials: dict,
- content_text: str,
- voice: str,
- user: Optional[str] = None,
- ) -> Any:
- """
- _invoke text2speech model
-
- :param model: model name
- :param tenant_id: user tenant id
- :param credentials: model credentials
- :param content_text: text content to be translated
- :param voice: model timbre
- :param user: unique user id
- :return: text translated to audio file
- """
- voices = self.get_tts_model_voices(model=model, credentials=credentials) or []
- if not voice or voice not in [d["value"] for d in voices]:
- voice = self._get_model_default_voice(model, credentials)
- return self._tts_invoke_streaming(
- model=model, credentials=credentials, content_text=content_text, voice=voice
- )
-
- def validate_credentials(self, model: str, credentials: Mapping) -> None:
- """
- validate credentials text2speech model
-
- :param model: model name
- :param credentials: model credentials
- :param user: unique user id
- :return: text translated to audio file
- """
- try:
- self._tts_invoke_streaming(
- model=model,
- credentials=credentials,
- content_text="Hello SiliconFlow!",
- voice=self._get_model_default_voice(model, credentials),
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex))
-
- def _tts_invoke_streaming(
- self, model: str, credentials: Mapping, content_text: str, voice: str
- ) -> Any:
- """
- _tts_invoke_streaming text2speech model
-
- :param model: model name
- :param credentials: model credentials
- :param content_text: text content to be translated
- :param voice: model timbre
- :return: text translated to audio file
- """
- credentials = dict(credentials)
- try:
- self._add_custom_parameters(credentials)
- credentials_kwargs = self._to_credential_kwargs(credentials)
- client = OpenAI(**credentials_kwargs)
- voices = (
- self.get_tts_model_voices(model=model, credentials=credentials) or []
- )
- model_support_voice = [x.get("value") for x in voices]
- if not voice or voice not in model_support_voice:
- voice = self._get_model_default_voice(model, credentials)
- if len(content_text) > 4096:
- sentences = self._split_text_into_sentences(
- content_text, max_length=4096
- )
- executor = concurrent.futures.ThreadPoolExecutor(
- max_workers=min(3, len(sentences))
- )
- futures = [
- executor.submit(
- client.audio.speech.with_streaming_response.create,
- model=model,
- response_format="mp3",
- input=sentences[i],
- voice=voice,
- )
- for i in range(len(sentences))
- ]
- for future in futures:
- yield from future.result().__enter__().iter_bytes(1024)
- else:
- response = client.audio.speech.with_streaming_response.create(
- model=model,
- voice=voice,
- response_format="mp3",
- input=content_text.strip(),
- )
- yield from response.__enter__().iter_bytes(1024)
- except Exception as ex:
- raise InvokeBadRequestError(str(ex))
-
- @classmethod
- def _add_custom_parameters(cls, credentials: dict) -> None:
- credentials["openai_api_base"] = "https://api.siliconflow.cn"
- credentials["openai_api_key"] = credentials["api_key"]
-
- def _to_credential_kwargs(self, credentials: Mapping) -> dict:
- """
- Transform credentials to kwargs for model instance
-
- :param credentials:
- :return:
- """
- credentials_kwargs = {
- "api_key": credentials["openai_api_key"],
- "timeout": Timeout(315.0, read=300.0, write=10.0, connect=5.0),
- "max_retries": 1,
- }
-
- if credentials.get("openai_api_base"):
- openai_api_base = credentials["openai_api_base"].rstrip("/")
- credentials_kwargs["base_url"] = openai_api_base + "/v1"
-
- if "openai_organization" in credentials:
- credentials_kwargs["organization"] = credentials["openai_organization"]
-
- return credentials_kwargs
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.py b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.py
deleted file mode 100644
index 087751d3d1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.py
+++ /dev/null
@@ -1,24 +0,0 @@
-import logging
-from dify_plugin import ModelProvider
-from dify_plugin.entities.model import ModelType
-from dify_plugin.errors.model import CredentialsValidateFailedError
-
-logger = logging.getLogger(__name__)
-
-
-class SiliconflowProvider(ModelProvider):
- def validate_provider_credentials(self, credentials: dict) -> None:
- """
- Validate provider credentials
- if validate failed, raise exception
-
- :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
- """
- try:
- model_instance = self.get_model_instance(ModelType.LLM)
- model_instance.validate_credentials(model="deepseek-ai/DeepSeek-V2.5", credentials=credentials)
- except CredentialsValidateFailedError as ex:
- raise ex
- except Exception as ex:
- logger.exception(f"{self.get_provider_schema().provider} credentials validate failed")
- raise ex
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.yaml b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.yaml
deleted file mode 100644
index 0c22f041e0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/provider/siliconflow.yaml
+++ /dev/null
@@ -1,114 +0,0 @@
-background: "#ffecff"
-configurate_methods:
- - predefined-model
- - customizable-model
-extra:
- python:
- model_sources:
- - models/llm/llm.py
- - models/rerank/rerank.py
- - models/text_embedding/text_embedding.py
- - models/tts/tts.py
- - models/speech2text/speech2text.py
- provider_source: provider/siliconflow.py
-help:
- title:
- en_US: Get your API Key from SiliconFlow
- zh_Hans: 从 SiliconFlow 获取 API Key
- url:
- en_US: https://cloud.siliconflow.cn/account/ak
-icon_large:
- en_US: siliconflow.svg
-icon_small:
- en_US: siliconflow_square.svg
-label:
- en_US: SiliconFlow
- zh_Hans: 硅基流动
-model_credential_schema:
- credential_form_schemas:
- - label:
- en_US: API Key
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 在此输入您的 API Key
- required: true
- type: secret-input
- variable: api_key
- - default: "4096"
- label:
- en_US: Model context size
- zh_Hans: 模型上下文长度
- placeholder:
- en_US: Enter your Model context size
- zh_Hans: 在此输入您的模型上下文长度
- required: true
- type: text-input
- variable: context_size
- - default: "4096"
- label:
- en_US: Upper bound for max tokens
- zh_Hans: 最大 token 上限
- show_on:
- - value: llm
- variable: __model_type
- type: text-input
- variable: max_tokens
- - default: no_call
- label:
- en_US: Function calling
- options:
- - label:
- en_US: Not Support
- zh_Hans: 不支持
- value: no_call
- - label:
- en_US: Support
- zh_Hans: 支持
- value: function_call
- required: false
- show_on:
- - value: llm
- variable: __model_type
- type: select
- variable: function_calling_type
- model:
- label:
- en_US: Model Name
- zh_Hans: 模型名称
- placeholder:
- en_US: Enter your model name
- zh_Hans: 输入模型名称
-models:
- llm:
- position: models/llm/_position.yaml
- predefined:
- - models/llm/*.yaml
- rerank:
- predefined:
- - models/rerank/*.yaml
- speech2text:
- predefined:
- - models/speech2text/*.yaml
- text_embedding:
- predefined:
- - models/text_embedding/*.yaml
- tts:
- predefined:
- - models/tts/*.yaml
-provider: siliconflow
-provider_credential_schema:
- credential_form_schemas:
- - label:
- en_US: API Key
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 在此输入您的 API Key
- required: true
- type: secret-input
- variable: api_key
-supported_model_types:
- - llm
- - text-embedding
- - rerank
- - speech2text
- - tts
diff --git a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/requirements.txt
deleted file mode 100644
index 555a9390ba..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/siliconflow-0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3/requirements.txt
+++ /dev/null
@@ -1,3 +0,0 @@
-dify_plugin==0.0.1b73
-httpx~=0.27.2
-openai~=1.57.0
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/.env.example b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/.env.example
deleted file mode 100644
index dbb75b858b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/.env.example
+++ /dev/null
@@ -1,4 +0,0 @@
-INSTALL_METHOD=remote
-REMOTE_INSTALL_HOST=debug-plugin.dify.dev
-REMOTE_INSTALL_PORT=5003
-REMOTE_INSTALL_KEY=********-****-****-****-************
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/README.md b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/README.md
deleted file mode 100644
index 54bc105805..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/README.md
+++ /dev/null
@@ -1,7 +0,0 @@
-# Overview
-Tongyi Qwen, developed by Alibaba Cloud, is a sophisticated series of LLMs. It includes multiple variants, such as Qwen for text processing, Qwen-VL for vision-language tasks, and Qwen-Audio for audio understanding. The models are notable for their impressive scale, with the flagship Qwen-72B model featuring 72 billion parameters and trained on over 3 trillion tokens.
-
-# Configure
-After installation, you need to get API keys from [Alibaba Cloud](https://bailian.console.aliyun.com/?apiKey=1#/api-key) and setup in Settings -> Model Provider.
-
-
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_en.png b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_en.png
deleted file mode 100644
index 94de01136a..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_en.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_zh.png b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_zh.png
deleted file mode 100644
index bd8f2762d1..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_l_zh.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_s_en.png b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_s_en.png
deleted file mode 100644
index c1aff40ee0..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/icon_s_en.png and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/tongyi.PNG b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/tongyi.PNG
deleted file mode 100644
index ff8806744b..0000000000
Binary files a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/_assets/tongyi.PNG and /dev/null differ
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/main.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/main.py
deleted file mode 100644
index f2bfcdfc0e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/main.py
+++ /dev/null
@@ -1,6 +0,0 @@
-from dify_plugin import Plugin, DifyPluginEnv
-
-plugin = Plugin(DifyPluginEnv())
-
-if __name__ == '__main__':
- plugin.run()
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/manifest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/manifest.yaml
deleted file mode 100644
index e1cb6ef016..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/manifest.yaml
+++ /dev/null
@@ -1,29 +0,0 @@
-meta:
- arch:
- - amd64
- - arm64
- runner:
- entrypoint: main
- language: python
- version: "3.12"
- version: 0.0.1
-name: tongyi
-author: langgenius
-label:
- en_US: TONGYI
- zh_Hans: 通义千问
-description:
- en_US: TONGYI
- zh_Hans: 通义千问
-icon: icon_s_en.png
-plugins:
- models:
- - provider/tongyi.yaml
-resource:
- memory: 268435456
- permission:
- model:
- enabled: false
-type: plugin
-version: 0.0.14
-created_at: "2024-09-20T00:13:50.29298939-04:00"
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/_common.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/_common.py
deleted file mode 100644
index e22441e834..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/_common.py
+++ /dev/null
@@ -1,55 +0,0 @@
-from dashscope.common.error import (
- AuthenticationError,
- InvalidParameter,
- RequestFailure,
- ServiceUnavailableError,
- UnsupportedHTTPMethod,
- UnsupportedModel,
-)
-
-from dify_plugin.errors.model import (
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-
-
-class _CommonTongyi:
- @staticmethod
- def _to_credential_kwargs(credentials: dict) -> dict:
- credentials_kwargs = {
- "dashscope_api_key": credentials["dashscope_api_key"],
- }
-
- return credentials_kwargs
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeConnectionError: [
- RequestFailure,
- ],
- InvokeServerUnavailableError: [
- ServiceUnavailableError,
- ],
- InvokeRateLimitError: [],
- InvokeAuthorizationError: [
- AuthenticationError,
- ],
- InvokeBadRequestError: [
- InvalidParameter,
- UnsupportedModel,
- UnsupportedHTTPMethod,
- ],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/_position.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/_position.yaml
deleted file mode 100644
index 0cf4612f18..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/_position.yaml
+++ /dev/null
@@ -1,67 +0,0 @@
-- qwq-32b
-- qwq-plus
-- qwq-plus-0305
-- deepseek-r1
-- deepseek-r1-distill-qwen-14b
-- deepseek-r1-distill-qwen-32b
-- deepseek-v3
-- qwen2.5-vl-72b-instruct
-- qwen2.5-vl-7b-instruct
-- qwen2.5-vl-3b-instruct
-- qwen-vl-max-latest
-- qwen-vl-max-2025-01-25
-- qwen-vl-max-0809
-- qwen-vl-max-0201
-- qwen-vl-max
-- qwen-max-latest
-- qwen-max-1201
-- qwen-max-0919
-- qwen-max-0428
-- qwen-max-0403
-- qwen-max-0107
-- qwen-max
-- qwen-max-longcontext
-- qwen-plus-latest
-- qwen-plus-0919
-- qwen-plus-0806
-- qwen-plus-0723
-- qwen-plus-0624
-- qwen-plus-0206
-- qwen-plus-chat
-- qwen-plus
-- qwen-vl-plus-latest
-- qwen-vl-plus-2025-01-25
-- qwen-vl-plus-2025-01-02
-- qwen-vl-plus-0809
-- qwen-vl-plus
-- qwen-turbo-latest
-- qwen-turbo-0919
-- qwen-turbo-0624
-- qwen-turbo-0206
-- qwen-turbo-chat
-- qwen-turbo
-- qwen2.5-72b-instruct
-- qwen2.5-32b-instruct
-- qwen2.5-14b-instruct-1m
-- qwen2.5-14b-instruct
-- qwen2.5-7b-instruct-1m
-- qwen2.5-7b-instruct
-- qwen2.5-3b-instruct
-- qwen2.5-1.5b-instruct
-- qwen2.5-0.5b-instruct
-- qwen2.5-coder-7b-instruct
-- qwen2-math-72b-instruct
-- qwen2-math-7b-instruct
-- qwen2-math-1.5b-instruct
-- qwen-long
-- qwen-math-plus-latest
-- qwen-math-plus-0919
-- qwen-math-plus-0816
-- qwen-math-plus
-- qwen-math-turbo-latest
-- qwen-math-turbo-0919
-- qwen-math-turbo
-- qwen-coder-turbo-latest
-- qwen-coder-turbo-0919
-- qwen-coder-turbo
-- farui-plus
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-14B.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-14B.yaml
deleted file mode 100644
index 2bce8805c6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-14B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-r1-distill-qwen-14b
-label:
- zh_Hans: DeepSeek-R1-Distill-Qwen-14B
- en_US: DeepSeek-R1-Distill-Qwen-14B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.001"
- output: "0.003"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-32B.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-32B.yaml
deleted file mode 100644
index dfc155ff6a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1-distill-qwen-32B.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-r1-distill-qwen-32b
-label:
- zh_Hans: DeepSeek-R1-Distill-Qwen-32B
- en_US: DeepSeek-R1-Distill-Qwen-32B
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.002"
- output: "0.006"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1.yaml
deleted file mode 100644
index b97356e641..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-r1.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-model: deepseek-r1
-label:
- zh_Hans: DeepSeek-R1
- en_US: DeepSeek-R1
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- min: 1
- max: 8192
- default: 4096
-pricing:
- input: "0.004"
- output: "0.016"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-v3.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-v3.yaml
deleted file mode 100644
index 23f38d60d3..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/deepseek-v3.yaml
+++ /dev/null
@@ -1,52 +0,0 @@
-model: deepseek-v3
-label:
- zh_Hans: DeepSeek-V3
- en_US: DeepSeek-V3
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 64000
-parameter_rules:
- - name: temperature
- use_template: temperature
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 512
- min: 1
- max: 4096
- help:
- zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
- en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
- - name: top_p
- use_template: top_p
- - name: top_k
- label:
- zh_Hans: 取样数量
- en_US: Top k
- type: int
- help:
- zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
- en_US: Only sample from the top K options for each subsequent token.
- required: false
- - name: frequency_penalty
- use_template: frequency_penalty
- - name: response_format
- label:
- zh_Hans: 回复格式
- en_US: Response Format
- type: string
- help:
- zh_Hans: 指定模型必须输出的格式
- en_US: specifying the format that the model must output
- required: false
- options:
- - text
- - json_object
-pricing:
- input: "0.002"
- output: "0.008"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/farui-plus.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/farui-plus.yaml
deleted file mode 100644
index 34a57d1fc0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/farui-plus.yaml
+++ /dev/null
@@ -1,77 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: farui-plus
-label:
- en_US: farui-plus
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 12288
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.02'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/llm.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/llm.py
deleted file mode 100644
index df3b80f12b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/llm.py
+++ /dev/null
@@ -1,699 +0,0 @@
-import base64
-import os
-import tempfile
-import uuid
-from collections.abc import Generator
-from http import HTTPStatus
-from pathlib import Path
-from typing import Optional, Union, cast
-
-import requests
-from dashscope import Generation, MultiModalConversation, get_tokenizer
-from dashscope.api_entities.dashscope_response import GenerationResponse
-from dashscope.common.error import (
- AuthenticationError,
- InvalidParameter,
- RequestFailure,
- ServiceUnavailableError,
- UnsupportedHTTPMethod,
- UnsupportedModel,
-)
-from dify_plugin.entities.model import (
- AIModelEntity,
- FetchFrom,
- I18nObject,
- ModelFeature,
- ModelPropertyKey,
- ModelType,
- ParameterRule,
- ParameterType,
-)
-from dify_plugin.entities.model.llm import (
- LLMMode,
- LLMResult,
- LLMResultChunk,
- LLMResultChunkDelta,
-)
-from dify_plugin.entities.model.message import (
- AssistantPromptMessage,
- DocumentPromptMessageContent,
- ImagePromptMessageContent,
- PromptMessage,
- PromptMessageContentType,
- PromptMessageTool,
- SystemPromptMessage,
- TextPromptMessageContent,
- ToolPromptMessage,
- UserPromptMessage,
- VideoPromptMessageContent,
-)
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-from dify_plugin.interfaces.model.large_language_model import LargeLanguageModel
-from openai import OpenAI
-
-
-class TongyiLargeLanguageModel(LargeLanguageModel):
- tokenizers = {}
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- """
- Invoke large language model
-
- :param model: model name
- :param credentials: model credentials
- :param prompt_messages: prompt messages
- :param model_parameters: model parameters
- :param tools: tools for tool calling
- :param stop: stop words
- :param stream: is stream response
- :param user: unique user id
- :return: full response or stream response chunk generator result
- """
- return self._generate(
- model,
- credentials,
- prompt_messages,
- model_parameters,
- tools,
- stop,
- stream,
- user,
- )
-
- def get_num_tokens(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- tools: Optional[list[PromptMessageTool]] = None,
- ) -> int:
- """
- Get number of tokens for given prompt messages
-
- :param model: model name
- :param credentials: model credentials
- :param prompt_messages: prompt messages
- :param tools: tools for tool calling
- :return:
- """
- if self.get_customizable_model_schema(model, credentials) is not None:
- return 0
- if model in {"qwen-turbo-chat", "qwen-plus-chat"}:
- model = model.replace("-chat", "")
- if model == "farui-plus":
- model = "qwen-farui-plus"
- if model in self.tokenizers:
- tokenizer = self.tokenizers[model]
- else:
- tokenizer = get_tokenizer(model)
- self.tokenizers[model] = tokenizer
- tokens = tokenizer.encode(self._convert_messages_to_prompt(prompt_messages))
- return len(tokens)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- self._generate(
- model=model,
- credentials=credentials,
- prompt_messages=[UserPromptMessage(content="ping")],
- model_parameters={"temperature": 0.5},
- stream=False,
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex))
-
- def _generate(
- self,
- model: str,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- model_parameters: dict,
- tools: Optional[list[PromptMessageTool]] = None,
- stop: Optional[list[str]] = None,
- stream: bool = True,
- user: Optional[str] = None,
- ) -> Union[LLMResult, Generator]:
- """
- Invoke large language model
-
- :param model: model name
- :param credentials: credentials
- :param prompt_messages: prompt messages
- :param tools: tools for tool calling
- :param model_parameters: model parameters
- :param stop: stop words
- :param stream: is stream response
- :param user: unique user id
- :return: full response or stream response chunk generator result
- """
- credentials_kwargs = self._to_credential_kwargs(credentials)
- mode = self.get_model_mode(model, credentials)
- if model in {"qwen-turbo-chat", "qwen-plus-chat"}:
- model = model.replace("-chat", "")
- extra_model_kwargs = {}
- if tools:
- extra_model_kwargs["tools"] = self._convert_tools(tools)
- if stop:
- extra_model_kwargs["stop"] = stop
- params = {
- "model": model,
- **model_parameters,
- **credentials_kwargs,
- **extra_model_kwargs,
- }
- model_schema = self.get_model_schema(model, credentials)
- if ModelFeature.VISION in (model_schema.features or []):
- params["messages"] = self._convert_prompt_messages_to_tongyi_messages(
- credentials, prompt_messages, rich_content=True
- )
- response = MultiModalConversation.call(**params, stream=stream)
- else:
- params["messages"] = self._convert_prompt_messages_to_tongyi_messages(
- credentials, prompt_messages
- )
- response = Generation.call(
- **params,
- result_format="message",
- stream=stream,
- incremental_output=False if tools else stream,
- )
- if stream:
- return self._handle_generate_stream_response(
- model, credentials, response, prompt_messages
- )
- return self._handle_generate_response(
- model, credentials, response, prompt_messages
- )
-
- def _handle_generate_response(
- self,
- model: str,
- credentials: dict,
- response: GenerationResponse,
- prompt_messages: list[PromptMessage],
- ) -> LLMResult:
- """
- Handle llm response
-
- :param model: model name
- :param credentials: credentials
- :param response: response
- :param prompt_messages: prompt messages
- :return: llm response
- """
- if response.status_code not in {200, HTTPStatus.OK}:
- raise ServiceUnavailableError(response.message)
- resp_content = response.output.choices[0].message.content
- # special for qwen-vl
- if isinstance(resp_content, list):
- resp_content = resp_content[0]["text"]
- assistant_prompt_message = AssistantPromptMessage(content=resp_content)
- usage = self._calc_response_usage(
- model,
- credentials,
- response.usage.input_tokens,
- response.usage.output_tokens,
- )
- result = LLMResult(
- model=model,
- message=assistant_prompt_message,
- prompt_messages=prompt_messages,
- usage=usage,
- )
- return result
-
- def _handle_tool_call_stream(self, response, tool_calls):
- tool_calls_stream = response.output.choices[0].message["tool_calls"]
- for tool_call_stream in tool_calls_stream:
- idx = tool_call_stream.get('index')
- if idx >= len(tool_calls):
- tool_calls.append(tool_call_stream)
- else:
- if tool_call_stream.get('function'):
- func_name = tool_call_stream.get('function').get('name')
- tool_call_obj = tool_calls[idx]
- if func_name:
- tool_call_obj['function']['name'] += func_name
- args = tool_call_stream.get('function').get('arguments')
- if args:
- tool_call_obj['function']['arguments'] += args
-
- def _handle_generate_stream_response(
- self,
- model: str,
- credentials: dict,
- responses: Generator[GenerationResponse, None, None],
- prompt_messages: list[PromptMessage],
- ) -> Generator:
- """
- Handle llm stream response
-
- :param model: model name
- :param credentials: credentials
- :param responses: response
- :param prompt_messages: prompt messages
- :return: llm response chunk generator result
- """
- is_reasoning = False
- full_text = ""
- tool_calls = []
- for index, response in enumerate(responses):
- if response.status_code not in {200, HTTPStatus.OK}:
- raise ServiceUnavailableError(
- f"Failed to invoke model {model}, status code: {response.status_code}, message: {response.message}"
- )
- resp_finish_reason = response.output.choices[0].finish_reason
- if resp_finish_reason is not None and resp_finish_reason != "null":
- resp_content = response.output.choices[0].message.content
- assistant_prompt_message = AssistantPromptMessage(content="")
- if "tool_calls" in response.output.choices[0].message:
- self._handle_tool_call_stream(response, tool_calls)
- elif resp_content:
- if isinstance(resp_content, list):
- resp_content = resp_content[0]["text"]
- assistant_prompt_message.content = resp_content.replace(
- full_text, "", 1
- )
- full_text = resp_content
- if tool_calls:
- message_tool_calls = []
- for tool_call_obj in tool_calls:
- message_tool_call = AssistantPromptMessage.ToolCall(
- id=tool_call_obj["function"]["name"],
- type="function",
- function=AssistantPromptMessage.ToolCall.ToolCallFunction(
- name=tool_call_obj["function"]["name"],
- arguments=tool_call_obj["function"]["arguments"],
- ),
- )
- message_tool_calls.append(message_tool_call)
- assistant_prompt_message.tool_calls = message_tool_calls
- usage = response.usage
- usage = self._calc_response_usage(
- model, credentials, usage.input_tokens, usage.output_tokens
- )
- yield LLMResultChunk(
- model=model,
- prompt_messages=prompt_messages,
- delta=LLMResultChunkDelta(
- index=index,
- message=assistant_prompt_message,
- finish_reason=resp_finish_reason,
- usage=usage,
- ),
- )
- else:
- message = response.output.choices[0].message
-
- resp_content, is_reasoning = self._wrap_thinking_by_reasoning_content(
- message, is_reasoning
- )
- if not resp_content:
- if "tool_calls" in response.output.choices[0].message:
- self._handle_tool_call_stream(response, tool_calls)
- continue
- if isinstance(resp_content, list):
- resp_content = resp_content[0]["text"]
- assistant_prompt_message = AssistantPromptMessage(
- content=resp_content.replace(full_text, "", 1)
- )
- full_text = resp_content
- yield LLMResultChunk(
- model=model,
- prompt_messages=prompt_messages,
- delta=LLMResultChunkDelta(
- index=index, message=assistant_prompt_message
- ),
- )
-
- def _to_credential_kwargs(self, credentials: dict) -> dict:
- """
- Transform credentials to kwargs for model instance
-
- :param credentials:
- :return:
- """
- credentials_kwargs = {"api_key": credentials["dashscope_api_key"]}
- return credentials_kwargs
-
- def _convert_one_message_to_text(self, message: PromptMessage) -> str:
- """
- Convert a single message to a string.
-
- :param message: PromptMessage to convert.
- :return: String representation of the message.
- """
- human_prompt = "\n\nHuman:"
- ai_prompt = "\n\nAssistant:"
- content = message.content
- if isinstance(message, UserPromptMessage):
- if isinstance(content, str):
- message_text = f"{human_prompt} {content}"
- else:
- message_text = ""
- for sub_message in content:
- if sub_message.type == PromptMessageContentType.TEXT:
- message_text = f"{human_prompt} {sub_message.data}"
- break
- elif isinstance(message, AssistantPromptMessage):
- message_text = f"{ai_prompt} {content}"
- elif isinstance(message, SystemPromptMessage | ToolPromptMessage):
- message_text = content
- else:
- raise ValueError(f"Got unknown type {message}")
- return message_text
-
- def _convert_messages_to_prompt(self, messages: list[PromptMessage]) -> str:
- """
- Format a list of messages into a full prompt for the Anthropic model
-
- :param messages: List of PromptMessage to combine.
- :return: Combined string with necessary human_prompt and ai_prompt tags.
- """
- messages = messages.copy()
- text = "".join(
- (self._convert_one_message_to_text(message) for message in messages)
- )
- return text.rstrip()
-
- def _convert_prompt_messages_to_tongyi_messages(
- self,
- credentials: dict,
- prompt_messages: list[PromptMessage],
- rich_content: bool = False,
- ) -> list[dict]:
- """
- Convert prompt messages to tongyi messages
-
- :param prompt_messages: prompt messages
- :return: tongyi messages
- """
- tongyi_messages = []
- for prompt_message in prompt_messages:
- if isinstance(prompt_message, SystemPromptMessage):
- tongyi_messages.append(
- {
- "role": "system",
- "content": (
- prompt_message.content
- if not rich_content
- else [{"text": prompt_message.content}]
- ),
- }
- )
- elif isinstance(prompt_message, UserPromptMessage):
- if isinstance(prompt_message.content, str):
- tongyi_messages.append(
- {
- "role": "user",
- "content": (
- prompt_message.content
- if not rich_content
- else [{"text": prompt_message.content}]
- ),
- }
- )
- else:
- user_messages = []
- file_id_list = []
- for message_content in prompt_message.content:
- if message_content.type == PromptMessageContentType.TEXT:
- message_content = cast(
- TextPromptMessageContent, message_content
- )
- sub_message_dict = {"text": message_content.data}
- user_messages.append(sub_message_dict)
- elif message_content.type == PromptMessageContentType.IMAGE:
- message_content = cast(
- ImagePromptMessageContent, message_content
- )
- image_url = message_content.data
- if message_content.data.startswith("data:"):
- image_url = self._save_base64_image_to_file(
- message_content.data
- )
- sub_message_dict = {"image": image_url}
- user_messages.append(sub_message_dict)
- elif message_content.type == PromptMessageContentType.VIDEO:
- message_content = cast(
- VideoPromptMessageContent, message_content
- )
- video_url = message_content.data
- if message_content.data.startswith("data:"):
- raise InvokeError(
- "not support base64, please set MULTIMODAL_SEND_VIDEO_FORMAT to url"
- )
- sub_message_dict = {"video": video_url}
- user_messages.append(sub_message_dict)
- elif message_content.type == PromptMessageContentType.DOCUMENT:
- message_content = cast(
- DocumentPromptMessageContent, message_content
- )
- file_id = self._upload_file_to_tongyi(
- credentials, message_content
- )
- file_id_url = f"fileid://{file_id}"
- file_id_list.append(file_id_url)
- if len(file_id_list) > 0:
- tongyi_messages.append(
- {"role": "system", "content": ",".join(file_id_list)}
- )
- user_messages = sorted(user_messages, key=lambda x: "text" in x)
- tongyi_messages.append({"role": "user", "content": user_messages})
- elif isinstance(prompt_message, AssistantPromptMessage):
- content = prompt_message.content
- if not content:
- content = " "
- message = {
- "role": "assistant",
- "content": content if not rich_content else [{"text": content}],
- }
- if prompt_message.tool_calls:
- message["tool_calls"] = [
- tool_call.model_dump()
- for tool_call in prompt_message.tool_calls
- ]
- tongyi_messages.append(message)
- elif isinstance(prompt_message, ToolPromptMessage):
- tongyi_messages.append(
- {
- "role": "tool",
- "content": prompt_message.content,
- "name": prompt_message.tool_call_id,
- }
- )
- else:
- raise ValueError(f"Got unknown type {prompt_message}")
- return tongyi_messages
-
- def _save_base64_image_to_file(self, base64_image: str) -> str:
- """
- Save base64 image to file
- 'data:{upload_file.mime_type};base64,{encoded_string}'
-
- :param base64_image: base64 image data
- :return: image file path
- """
- (mime_type, encoded_string) = (
- base64_image.split(",")[0].split(";")[0].split(":")[1],
- base64_image.split(",")[1],
- )
- temp_dir = tempfile.gettempdir()
- file_path = os.path.join(temp_dir, f"{uuid.uuid4()}.{mime_type.split('/')[1]}")
- Path(file_path).write_bytes(base64.b64decode(encoded_string))
- return f"file://{file_path}"
-
- def _upload_file_to_tongyi(
- self, credentials: dict, message_content: DocumentPromptMessageContent
- ) -> str:
- """
- Upload file to Tongyi
-
- :param credentials: credentials for Tongyi
- :param message_content: message content to upload
- :return: file ID in Tongyi
- """
- client = OpenAI(
- api_key=credentials.dashscope_api_key,
- base_url="https://dashscope.aliyuncs.com/compatible-mode/v1",
- )
- with tempfile.NamedTemporaryFile(delete=False) as temp_file:
- if message_content.base64_data:
- file_content = base64.b64decode(message_content.base64_data)
- temp_file.write(file_content)
- else:
- try:
- response = requests.get(message_content.url, timeout=60)
- response.raise_for_status()
- temp_file.write(response.content)
- except Exception as ex:
- raise ValueError(
- f"Failed to fetch data from url {message_content.url}, {ex}"
- ) from ex
- temp_file.flush()
- response = client.files.create(file=temp_file, purpose="file-extract")
- return response.id
-
- def _convert_tools(self, tools: list[PromptMessageTool]) -> list[dict]:
- """
- Convert tools
- """
- tool_definitions = []
- for tool in tools:
- properties = tool.parameters["properties"]
- required_properties = tool.parameters["required"]
- properties_definitions = {}
- for p_key, p_val in properties.items():
- desc = p_val["description"]
- if "enum" in p_val:
- desc += f"; Only accepts one of the following predefined options: [{', '.join(p_val['enum'])}]"
- properties_definitions[p_key] = {
- "description": desc,
- "type": p_val["type"],
- }
- tool_definition = {
- "type": "function",
- "function": {
- "name": tool.name,
- "description": tool.description,
- "parameters": properties_definitions,
- "required": required_properties,
- },
- }
- tool_definitions.append(tool_definition)
- return tool_definitions
- def _wrap_thinking_by_reasoning_content(self, delta: dict, is_reasoning: bool) -> tuple[str, bool]:
- """
- If the reasoning response is from delta.get("reasoning_content"), we wrap
- it with HTML think tag.
- :param delta: delta dictionary from LLM streaming response
- :param is_reasoning: is reasoning
- :return: tuple of (processed_content, is_reasoning)
- """
-
- content = delta.get("content") or ""
- reasoning_content = delta.get("reasoning_content")
-
- if reasoning_content:
- if not is_reasoning:
- content = "\n" + reasoning_content
- is_reasoning = True
- else:
- content = reasoning_content
- elif is_reasoning and content:
- content = "\n" + content
- is_reasoning = False
- return content, is_reasoning
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeConnectionError: [RequestFailure],
- InvokeServerUnavailableError: [ServiceUnavailableError],
- InvokeRateLimitError: [],
- InvokeAuthorizationError: [AuthenticationError],
- InvokeBadRequestError: [
- InvalidParameter,
- UnsupportedModel,
- UnsupportedHTTPMethod,
- ],
- }
-
- def get_customizable_model_schema(
- self, model: str, credentials: dict
- ) -> Optional[AIModelEntity]:
- """
- Architecture for defining customizable models
-
- :param model: model name
- :param credentials: model credentials
- :return: AIModelEntity or None
- """
- return AIModelEntity(
- model=model,
- label=I18nObject(en_US=model, zh_Hans=model),
- model_type=ModelType.LLM,
- features=(
- [
- ModelFeature.TOOL_CALL,
- ModelFeature.MULTI_TOOL_CALL,
- ModelFeature.STREAM_TOOL_CALL,
- ]
- if credentials.get("function_calling_type") == "tool_call"
- else []
- ),
- fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
- model_properties={
- ModelPropertyKey.CONTEXT_SIZE: int(
- credentials.get("context_size", 8000)
- ),
- ModelPropertyKey.MODE: LLMMode.CHAT.value,
- },
- parameter_rules=[
- ParameterRule(
- name="temperature",
- use_template="temperature",
- label=I18nObject(en_US="Temperature", zh_Hans="温度"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="max_tokens",
- use_template="max_tokens",
- default=512,
- min=1,
- max=int(credentials.get("max_tokens", 1024)),
- label=I18nObject(en_US="Max Tokens", zh_Hans="最大标记"),
- type=ParameterType.INT,
- ),
- ParameterRule(
- name="top_p",
- use_template="top_p",
- label=I18nObject(en_US="Top P", zh_Hans="Top P"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="top_k",
- use_template="top_k",
- label=I18nObject(en_US="Top K", zh_Hans="Top K"),
- type=ParameterType.FLOAT,
- ),
- ParameterRule(
- name="frequency_penalty",
- use_template="frequency_penalty",
- label=I18nObject(en_US="Frequency Penalty", zh_Hans="重复惩罚"),
- type=ParameterType.FLOAT,
- ),
- ],
- )
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-0919.yaml
deleted file mode 100644
index 64a3f33133..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-0919.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-coder-turbo-0919
-label:
- en_US: qwen-coder-turbo-0919
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-latest.yaml
deleted file mode 100644
index a4c93f7047..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo-latest.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-coder-turbo-latest
-label:
- en_US: qwen-coder-turbo-latest
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo.yaml
deleted file mode 100644
index ff68faed80..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-coder-turbo.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-coder-turbo
-label:
- en_US: qwen-coder-turbo
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-long.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-long.yaml
deleted file mode 100644
index be0a522709..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-long.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-long
-label:
- en_US: qwen-long
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
- - document
-model_properties:
- mode: chat
- context_size: 10000000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 6000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: "0.0005"
- output: "0.002"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0816.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0816.yaml
deleted file mode 100644
index 42fe1f6862..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0816.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-plus-0816
-label:
- en_US: qwen-math-plus-0816
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0919.yaml
deleted file mode 100644
index 9b6567b8cd..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-0919.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-plus-0919
-label:
- en_US: qwen-math-plus-0919
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-latest.yaml
deleted file mode 100644
index b2a2393b36..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus-latest.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-plus-latest
-label:
- en_US: qwen-math-plus-latest
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus.yaml
deleted file mode 100644
index 63f4b7ff0a..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-plus.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-plus
-label:
- en_US: qwen-math-plus
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-0919.yaml
deleted file mode 100644
index 4da90eec3e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-0919.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-turbo-0919
-label:
- en_US: qwen-math-turbo-0919
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-latest.yaml
deleted file mode 100644
index d29f8851dd..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo-latest.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-turbo-latest
-label:
- en_US: qwen-math-turbo-latest
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo.yaml
deleted file mode 100644
index 2a8f7f725e..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-math-turbo.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-math-turbo
-label:
- en_US: qwen-math-turbo
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 3072
- min: 1
- max: 3072
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0107.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0107.yaml
deleted file mode 100644
index 661311f178..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0107.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-0107
-label:
- en_US: qwen-max-0107
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.04'
- output: '0.12'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0403.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0403.yaml
deleted file mode 100644
index 76b739a92b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0403.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max-0403, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-0403
-label:
- en_US: qwen-max-0403
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.04'
- output: '0.12'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0428.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0428.yaml
deleted file mode 100644
index 334b41257f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0428.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max-0428, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-0428
-label:
- en_US: qwen-max-0428
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.04'
- output: '0.12'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0919.yaml
deleted file mode 100644
index bfa70ca935..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-0919.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max-0919, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-0919
-label:
- en_US: qwen-max-0919
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.06'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-1201.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-1201.yaml
deleted file mode 100644
index 83c5732cd6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-1201.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-1201
-label:
- en_US: qwen-max-1201
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.04'
- output: '0.12'
- unit: '0.001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-latest.yaml
deleted file mode 100644
index 538bfb0448..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-latest.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-latest
-label:
- en_US: qwen-max-latest
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.06'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-longcontext.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-longcontext.yaml
deleted file mode 100644
index 52bd758702..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max-longcontext.yaml
+++ /dev/null
@@ -1,88 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max-longcontext
-label:
- en_US: qwen-max-longcontext
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8000
- min: 1
- max: 8000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.04'
- output: '0.12'
- unit: '0.001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max.yaml
deleted file mode 100644
index 4af4822e86..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-max.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwen-max
-label:
- en_US: qwen-max
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.06'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0206.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0206.yaml
deleted file mode 100644
index d37052f560..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0206.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-0206, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-0206
-label:
- en_US: qwen-plus-0206
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: completion
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8000
- min: 1
- max: 8000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0624.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0624.yaml
deleted file mode 100644
index 0025db9bd1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0624.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-0624, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-0624
-label:
- en_US: qwen-plus-0624
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: completion
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8000
- min: 1
- max: 8000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0723.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0723.yaml
deleted file mode 100644
index 401a15b690..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0723.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-0723, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-0723
-label:
- en_US: qwen-plus-0723
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: completion
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8000
- min: 1
- max: 8000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0806.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0806.yaml
deleted file mode 100644
index 39154708a1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0806.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-0806, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-0806
-label:
- en_US: qwen-plus-0806
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: completion
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0919.yaml
deleted file mode 100644
index 2ed2949a45..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-0919.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-0919, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-0919
-label:
- en_US: qwen-plus-0919
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: completion
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0008'
- output: '0.002'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-chat.yaml
deleted file mode 100644
index d891796bac..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-chat.yaml
+++ /dev/null
@@ -1,88 +0,0 @@
-# this model corresponds to qwen-plus, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-chat
-label:
- en_US: qwen-plus-chat
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-latest.yaml
deleted file mode 100644
index 7ef5c04975..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus-latest.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-plus-latest, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus-latest
-label:
- en_US: qwen-plus-latest
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0008'
- output: '0.002'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus.yaml
deleted file mode 100644
index 529a29b1b5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-plus.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-plus, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#bb0ffee88bwnk)
-model: qwen-plus
-label:
- en_US: qwen-plus
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 128000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0008'
- output: '0.002'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0206.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0206.yaml
deleted file mode 100644
index 09bc797465..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0206.yaml
+++ /dev/null
@@ -1,86 +0,0 @@
-# this model corresponds to qwen-turbo-0206, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-
-model: qwen-turbo-0206
-label:
- en_US: qwen-turbo-0206
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0624.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0624.yaml
deleted file mode 100644
index 036a96d1ae..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0624.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-turbo-0624, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-model: qwen-turbo-0624
-label:
- en_US: qwen-turbo-0624
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0919.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0919.yaml
deleted file mode 100644
index 866efa3248..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-0919.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-turbo-0919, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-model: qwen-turbo-0919
-label:
- en_US: qwen-turbo-0919
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0003'
- output: '0.0006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-chat.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-chat.yaml
deleted file mode 100644
index 98c78ba8ac..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-chat.yaml
+++ /dev/null
@@ -1,88 +0,0 @@
-# this model corresponds to qwen-turbo, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-model: qwen-turbo-chat
-label:
- en_US: qwen-turbo-chat
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 1500
- min: 1
- max: 1500
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-latest.yaml
deleted file mode 100644
index e1193aeb7f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo-latest.yaml
+++ /dev/null
@@ -1,85 +0,0 @@
-# this model corresponds to qwen-turbo-latest, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-model: qwen-turbo-latest
-label:
- en_US: qwen-turbo-latest
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0006'
- output: '0.0003'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo.yaml
deleted file mode 100644
index a0c4ba6820..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-turbo.yaml
+++ /dev/null
@@ -1,87 +0,0 @@
-# this model corresponds to qwen-turbo, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#ff492e2c10lub)
-model: qwen-turbo
-label:
- en_US: qwen-turbo
-model_type: llm
-features:
- - multi-tool-call
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 128000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: enable_search
- type: boolean
- default: false
- label:
- zh_Hans: 联网搜索
- en_US: Web Search
- help:
- zh_Hans: 模型内置了互联网搜索服务,该参数控制模型在生成文本时是否参考使用互联网搜索结果。启用互联网搜索,模型会将搜索结果作为文本生成过程中的参考信息,但模型会基于其内部逻辑“自行判断”是否使用互联网搜索结果。
- en_US: The model has a built-in Internet search service. This parameter controls whether the model refers to Internet search results when generating text. When Internet search is enabled, the model will use the search results as reference information in the text generation process, but the model will "judge" whether to use Internet search results based on its internal logic.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0006'
- output: '0.0003'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0201.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0201.yaml
deleted file mode 100644
index d80168ffc3..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0201.yaml
+++ /dev/null
@@ -1,49 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-max-0201
-label:
- en_US: qwen-vl-max-0201
-model_type: llm
-features:
- - vision
- - agent-thought
-model_properties:
- mode: chat
- context_size: 8192
-parameter_rules:
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.02'
- unit: '0.001'
- currency: RMB
-deprecated: true
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0809.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0809.yaml
deleted file mode 100644
index 94b6666d05..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-0809.yaml
+++ /dev/null
@@ -1,80 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-max-0809
-label:
- en_US: qwen-vl-max-0809
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: response_format
- use_template: response_format
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.02'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-2025-01-25.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-2025-01-25.yaml
deleted file mode 100644
index f458f7b252..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-2025-01-25.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-max-2025-01-25
-label:
- en_US: qwen-vl-max-2025-01-25
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.003'
- output: '0.009'
- unit: '0.001'
- currency: RMB
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-latest.yaml
deleted file mode 100644
index 73b90ad8b0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max-latest.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-max-latest
-label:
- en_US: qwen-vl-max-latest
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.003'
- output: '0.009'
- unit: '0.001'
- currency: RMB
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max.yaml
deleted file mode 100644
index b6172c1cbc..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-max.yaml
+++ /dev/null
@@ -1,80 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-max
-label:
- en_US: qwen-vl-max
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 32000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: response_format
- use_template: response_format
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.02'
- output: '0.02'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-0809.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-0809.yaml
deleted file mode 100644
index 0be4b68f4f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-0809.yaml
+++ /dev/null
@@ -1,80 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-plus-0809
-label:
- en_US: qwen-vl-plus-0809
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: response_format
- use_template: response_format
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.008'
- output: '0.008'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-02.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-02.yaml
deleted file mode 100644
index c586fb6693..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-02.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-plus-2025-01-02
-label:
- en_US: qwen-vl-plus-2025-01-02
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 1024
- min: 1
- max: 2048
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0015'
- output: '0.0045'
- unit: '0.001'
- currency: RMB
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-25.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-25.yaml
deleted file mode 100644
index f30b3749e1..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-2025-01-25.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-plus-2025-01-25
-label:
- en_US: qwen-vl-plus-2025-01-25
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.003'
- output: '0.009'
- unit: '0.001'
- currency: RMB
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-latest.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-latest.yaml
deleted file mode 100644
index 5787c45f4b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus-latest.yaml
+++ /dev/null
@@ -1,78 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-plus-latest
-label:
- en_US: qwen-vl-plus-latest
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 4096
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.003'
- output: '0.009'
- unit: '0.001'
- currency: RMB
\ No newline at end of file
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus.yaml
deleted file mode 100644
index 6c8a8121c6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen-vl-plus.yaml
+++ /dev/null
@@ -1,80 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen-vl-plus
-label:
- en_US: qwen-vl-plus
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 8000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: max_tokens
- required: false
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: response_format
- use_template: response_format
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.008'
- output: '0.008'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-1.5b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-1.5b-instruct.yaml
deleted file mode 100644
index ea157f42de..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-1.5b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2-math-1.5b-instruct
-label:
- en_US: qwen2-math-1.5b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-72b-instruct.yaml
deleted file mode 100644
index 37052a9233..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-72b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2-math-72b-instruct
-label:
- en_US: qwen2-math-72b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-7b-instruct.yaml
deleted file mode 100644
index e182f1c27f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2-math-7b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2-math-7b-instruct
-label:
- en_US: qwen2-math-7b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 4096
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 2000
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-0.5b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-0.5b-instruct.yaml
deleted file mode 100644
index 9e75ccc1f2..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-0.5b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-0.5b-instruct
-label:
- en_US: qwen2.5-0.5b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.000'
- output: '0.000'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-1.5b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-1.5b-instruct.yaml
deleted file mode 100644
index 67c9d31243..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-1.5b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-1.5b-instruct
-label:
- en_US: qwen2.5-1.5b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.000'
- output: '0.000'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct-1m.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct-1m.yaml
deleted file mode 100644
index 87c83bf0bb..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct-1m.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-14b-instruct-1m
-label:
- en_US: qwen2.5-14b-instruct-1m
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 1000000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: "0.001"
- output: "0.003"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct.yaml
deleted file mode 100644
index 2a38be921c..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-14b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-14b-instruct
-label:
- en_US: qwen2.5-14b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.006'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-32b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-32b-instruct.yaml
deleted file mode 100644
index e6e4fbf978..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-32b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-32b-instruct
-label:
- en_US: qwen2.5-32b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0035'
- output: '0.007'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-3b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-3b-instruct.yaml
deleted file mode 100644
index 8f250379a7..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-3b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-3b-instruct
-label:
- en_US: qwen2.5-3b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 32768
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.000'
- output: '0.000'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-72b-instruct.yaml
deleted file mode 100644
index bb3cdd6141..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-72b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-72b-instruct
-label:
- en_US: qwen2.5-72b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.004'
- output: '0.012'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct-1m.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct-1m.yaml
deleted file mode 100644
index fee32794b4..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct-1m.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-7b-instruct-1m
-label:
- en_US: qwen2.5-7b-instruct-1m
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 1000000
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: "0.0005"
- output: "0.001"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct.yaml
deleted file mode 100644
index fdcd3d4275..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-7b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-7b-instruct
-label:
- en_US: qwen2.5-7b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.001'
- output: '0.002'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-coder-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-coder-7b-instruct.yaml
deleted file mode 100644
index 7ebeec3953..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-coder-7b-instruct.yaml
+++ /dev/null
@@ -1,75 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-coder-7b-instruct
-label:
- en_US: qwen2.5-coder-7b-instruct
-model_type: llm
-features:
- - agent-thought
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.001'
- output: '0.002'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-3b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-3b-instruct.yaml
deleted file mode 100644
index 02c5d3f2d0..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-3b-instruct.yaml
+++ /dev/null
@@ -1,77 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-vl-3b-instruct
-label:
- en_US: qwen2.5-vl-3b-instruct
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.0012'
- output: '0.0036'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-72b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-72b-instruct.yaml
deleted file mode 100644
index 4fb5e2d2c9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-72b-instruct.yaml
+++ /dev/null
@@ -1,77 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-vl-72b-instruct
-label:
- en_US: qwen2.5-vl-72b-instruct
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.016'
- output: '0.048'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-7b-instruct.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-7b-instruct.yaml
deleted file mode 100644
index 4284ba0563..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwen2.5-vl-7b-instruct.yaml
+++ /dev/null
@@ -1,77 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models
-model: qwen2.5-vl-7b-instruct
-label:
- en_US: qwen2.5-vl-7b-instruct
-model_type: llm
-features:
- - vision
- - agent-thought
- - video
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: temperature
- use_template: temperature
- type: float
- default: 0.3
- min: 0.0
- max: 2.0
- help:
- zh_Hans: 用于控制随机性和多样性的程度。具体来说,temperature值控制了生成文本时对每个候选词的概率分布进行平滑的程度。较高的temperature值会降低概率分布的峰值,使得更多的低概率词被选择,生成结果更加多样化;而较低的temperature值则会增强概率分布的峰值,使得高概率词更容易被选择,生成结果更加确定。
- en_US: Used to control the degree of randomness and diversity. Specifically, the temperature value controls the degree to which the probability distribution of each candidate word is smoothed when generating text. A higher temperature value will reduce the peak value of the probability distribution, allowing more low-probability words to be selected, and the generated results will be more diverse; while a lower temperature value will enhance the peak value of the probability distribution, making it easier for high-probability words to be selected. , the generated results are more certain.
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 8192
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_p
- use_template: top_p
- type: float
- default: 0.8
- min: 0.1
- max: 0.9
- help:
- zh_Hans: 生成过程中核采样方法概率阈值,例如,取值为0.8时,仅保留概率加起来大于等于0.8的最可能token的最小集合作为候选集。取值范围为(0,1.0),取值越大,生成的随机性越高;取值越低,生成的确定性越高。
- en_US: The probability threshold of the kernel sampling method during the generation process. For example, when the value is 0.8, only the smallest set of the most likely tokens with a sum of probabilities greater than or equal to 0.8 is retained as the candidate set. The value range is (0,1.0). The larger the value, the higher the randomness generated; the lower the value, the higher the certainty generated.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
- - name: repetition_penalty
- required: false
- type: float
- default: 1.1
- label:
- zh_Hans: 重复惩罚
- en_US: Repetition penalty
- help:
- zh_Hans: 用于控制模型生成时的重复度。提高repetition_penalty时可以降低模型生成的重复度。1.0表示不做惩罚。
- en_US: Used to control the repeatability when generating models. Increasing repetition_penalty can reduce the duplication of model generation. 1.0 means no punishment.
- - name: response_format
- use_template: response_format
-pricing:
- input: '0.002'
- output: '0.005'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-32b.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-32b.yaml
deleted file mode 100644
index e36599fd47..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-32b.yaml
+++ /dev/null
@@ -1,48 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwq-32b
-label:
- en_US: qwq-32b
- zh_Hans: 通义千问QWQ-32B
-model_type: llm
-features:
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
-pricing:
- input: '0.012'
- output: '0.036'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus-0305.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus-0305.yaml
deleted file mode 100644
index fcb52ed26b..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus-0305.yaml
+++ /dev/null
@@ -1,48 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwq-plus-0305
-label:
- en_US: qwq-plus-0305
- zh_Hans: 通义千问QWQ-Plus-0305
-model_type: llm
-features:
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
-pricing:
- input: '0.0016'
- output: '0.004'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus.yaml
deleted file mode 100644
index 48d58997a3..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/llm/qwq-plus.yaml
+++ /dev/null
@@ -1,48 +0,0 @@
-# this model corresponds to qwen-max, for more details
-# please refer to (https://help.aliyun.com/zh/model-studio/getting-started/models#cf6cc4aa2aokf)
-model: qwq-plus
-label:
- en_US: qwq-plus
- zh_Hans: 通义千问QWQ-Plus
-model_type: llm
-features:
- - agent-thought
- - stream-tool-call
-model_properties:
- mode: chat
- context_size: 131072
-parameter_rules:
- - name: max_tokens
- use_template: max_tokens
- type: int
- default: 2000
- min: 1
- max: 8192
- help:
- zh_Hans: 用于指定模型在生成内容时token的最大数量,它定义了生成的上限,但不保证每次都会生成到这个数量。
- en_US: It is used to specify the maximum number of tokens when the model generates content. It defines the upper limit of generation, but does not guarantee that this number will be generated every time.
- - name: top_k
- type: int
- min: 0
- max: 99
- label:
- zh_Hans: 取样数量
- en_US: Top k
- help:
- zh_Hans: 生成时,采样候选集的大小。例如,取值为50时,仅将单次生成中得分最高的50个token组成随机采样的候选集。取值越大,生成的随机性越高;取值越小,生成的确定性越高。
- en_US: The size of the sample candidate set when generated. For example, when the value is 50, only the 50 highest-scoring tokens in a single generation form a randomly sampled candidate set. The larger the value, the higher the randomness generated; the smaller the value, the higher the certainty generated.
- - name: seed
- required: false
- type: int
- default: 1234
- label:
- zh_Hans: 随机种子
- en_US: Random seed
- help:
- zh_Hans: 生成时使用的随机数种子,用户控制模型生成内容的随机性。支持无符号64位整数,默认值为 1234。在使用seed时,模型将尽可能生成相同或相似的结果,但目前不保证每次生成的结果完全相同。
- en_US: The random number seed used when generating, the user controls the randomness of the content generated by the model. Supports unsigned 64-bit integers, default value is 1234. When using seed, the model will try its best to generate the same or similar results, but there is currently no guarantee that the results will be exactly the same every time.
-pricing:
- input: '0.0016'
- output: '0.004'
- unit: '0.001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/_position.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/_position.yaml
deleted file mode 100644
index 439afda992..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/_position.yaml
+++ /dev/null
@@ -1 +0,0 @@
-- gte-rerank
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/gte-rerank.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/gte-rerank.yaml
deleted file mode 100644
index 44d51b9b0d..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/gte-rerank.yaml
+++ /dev/null
@@ -1,4 +0,0 @@
-model: gte-rerank
-model_type: rerank
-model_properties:
- context_size: 4000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/rerank.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/rerank.py
deleted file mode 100644
index c82bcadfa9..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/rerank/rerank.py
+++ /dev/null
@@ -1,110 +0,0 @@
-from typing import Optional
-import dashscope
-from dashscope.common.error import (
- AuthenticationError,
- InvalidParameter,
- RequestFailure,
- ServiceUnavailableError,
- UnsupportedHTTPMethod,
- UnsupportedModel,
-)
-from dify_plugin.entities.model.rerank import RerankDocument, RerankResult
-from dify_plugin.errors.model import (
- CredentialsValidateFailedError,
- InvokeAuthorizationError,
- InvokeBadRequestError,
- InvokeConnectionError,
- InvokeError,
- InvokeRateLimitError,
- InvokeServerUnavailableError,
-)
-from dify_plugin.interfaces.model.rerank_model import RerankModel
-
-
-class GTERerankModel(RerankModel):
- """
- Model class for GTE rerank model.
- """
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- query: str,
- docs: list[str],
- score_threshold: Optional[float] = None,
- top_n: Optional[int] = None,
- user: Optional[str] = None,
- ) -> RerankResult:
- """
- Invoke rerank model
-
- :param model: model name
- :param credentials: model credentials
- :param query: search query
- :param docs: docs for reranking
- :param score_threshold: score threshold
- :param top_n: top n
- :param user: unique user id
- :return: rerank result
- """
- if len(docs) == 0:
- return RerankResult(model=model, docs=docs)
- dashscope.api_key = credentials["dashscope_api_key"]
- response = dashscope.TextReRank.call(
- query=query, documents=docs, model=model, top_n=top_n, return_documents=True
- )
- rerank_documents = []
- if not response.output:
- return RerankResult(model=model, docs=rerank_documents)
- for _, result in enumerate(response.output.results):
- rerank_document = RerankDocument(
- index=result.index, score=result.relevance_score, text=result["document"]["text"]
- )
- if score_threshold is not None:
- if result.relevance_score >= score_threshold:
- rerank_documents.append(rerank_document)
- else:
- rerank_documents.append(rerank_document)
- return RerankResult(model=model, docs=rerank_documents)
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- self.invoke(
- model=model,
- credentials=credentials,
- query="What is the capital of the United States?",
- docs=[
- "Carson City is the capital city of the American state of Nevada. At the 2010 United States Census, Carson City had a population of 55,274.",
- "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that are a political division controlled by the United States. Its capital is Saipan.",
- ],
- score_threshold=0.8,
- )
- except Exception as ex:
- print(ex)
- raise CredentialsValidateFailedError(str(ex))
-
- @property
- def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
- """
- Map model invoke error to unified error
- The key is the error type thrown to the caller
- The value is the error type thrown by the model,
- which needs to be converted into a unified error type for the caller.
-
- :return: Invoke error mapping
- """
- return {
- InvokeConnectionError: [RequestFailure],
- InvokeServerUnavailableError: [ServiceUnavailableError],
- InvokeRateLimitError: [],
- InvokeAuthorizationError: [AuthenticationError],
- InvokeBadRequestError: [InvalidParameter, UnsupportedModel, UnsupportedHTTPMethod],
- }
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v1.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v1.yaml
deleted file mode 100644
index 52e35d8b50..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v1.yaml
+++ /dev/null
@@ -1,10 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models#3383780daf8hw
-model: text-embedding-v1
-model_type: text-embedding
-model_properties:
- context_size: 2048
- max_chunks: 25
-pricing:
- input: "0.0007"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v2.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v2.yaml
deleted file mode 100644
index 5bb6a8f424..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v2.yaml
+++ /dev/null
@@ -1,10 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models#3383780daf8hw
-model: text-embedding-v2
-model_type: text-embedding
-model_properties:
- context_size: 2048
- max_chunks: 25
-pricing:
- input: "0.0007"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v3.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v3.yaml
deleted file mode 100644
index d8af0e2b63..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text-embedding-v3.yaml
+++ /dev/null
@@ -1,10 +0,0 @@
-# for more details, please refer to https://help.aliyun.com/zh/model-studio/getting-started/models#3383780daf8hw
-model: text-embedding-v3
-model_type: text-embedding
-model_properties:
- context_size: 8192
- max_chunks: 25
-pricing:
- input: "0.0007"
- unit: "0.001"
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text_embedding.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text_embedding.py
deleted file mode 100644
index b5e12c4c81..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/text_embedding/text_embedding.py
+++ /dev/null
@@ -1,167 +0,0 @@
-import time
-from typing import Optional
-import dashscope
-import numpy as np
-from dify_plugin.entities.model import EmbeddingInputType, PriceType
-from dify_plugin.entities.model.text_embedding import EmbeddingUsage, TextEmbeddingResult
-from dify_plugin.errors.model import CredentialsValidateFailedError
-from dify_plugin.interfaces.model.text_embedding_model import TextEmbeddingModel
-from models._common import _CommonTongyi
-
-
-class TongyiTextEmbeddingModel(_CommonTongyi, TextEmbeddingModel):
- """
- Model class for Tongyi text embedding model.
- """
-
- def _invoke(
- self,
- model: str,
- credentials: dict,
- texts: list[str],
- user: Optional[str] = None,
- input_type: EmbeddingInputType = EmbeddingInputType.DOCUMENT,
- ) -> TextEmbeddingResult:
- """
- Invoke text embedding model
-
- :param model: model name
- :param credentials: model credentials
- :param texts: texts to embed
- :param user: unique user id
- :param input_type: input type
- :return: embeddings result
- """
- credentials_kwargs = self._to_credential_kwargs(credentials)
- context_size = self._get_context_size(model, credentials)
- max_chunks = self._get_max_chunks(model, credentials)
- inputs = []
- indices = []
- used_tokens = 0
- for i, text in enumerate(texts):
- num_tokens = self._get_num_tokens_by_gpt2(text)
- if num_tokens >= context_size:
- cutoff = int(np.floor(len(text) * (context_size / num_tokens)))
- inputs.append(text[0:cutoff])
- else:
- inputs.append(text)
- indices += [i]
- batched_embeddings = []
- _iter = range(0, len(inputs), max_chunks)
- for i in _iter:
- (embeddings_batch, embedding_used_tokens) = self.embed_documents(
- credentials_kwargs=credentials_kwargs, model=model, texts=inputs[i : i + max_chunks]
- )
- used_tokens += embedding_used_tokens
- batched_embeddings += embeddings_batch
- usage = self._calc_response_usage(model=model, credentials=credentials, tokens=used_tokens)
- return TextEmbeddingResult(embeddings=batched_embeddings, usage=usage, model=model)
-
- def get_num_tokens(self, model: str, credentials: dict, texts: list[str]) -> list[int]:
- """
- Get number of tokens for given prompt messages
-
- :param model: model name
- :param credentials: model credentials
- :param texts: texts to embed
- :return:
- """
- if len(texts) == 0:
- return []
- tokens = []
- for text in texts:
- tokens.append(self._get_num_tokens_by_gpt2(text))
- return tokens
-
- def validate_credentials(self, model: str, credentials: dict) -> None:
- """
- Validate model credentials
-
- :param model: model name
- :param credentials: model credentials
- :return:
- """
- try:
- credentials_kwargs = self._to_credential_kwargs(credentials)
- self.embed_documents(credentials_kwargs=credentials_kwargs, model=model, texts=["ping"])
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex))
-
- @staticmethod
- def embed_documents(credentials_kwargs: dict, model: str, texts: list[str]) -> tuple[list[list[float]], int]:
- """Call out to Tongyi's embedding endpoint.
-
- Args:
- credentials_kwargs: The credentials to use for the call.
- model: The model to use for embedding.
- texts: The list of texts to embed.
-
- Returns:
- List of embeddings, one for each text, and tokens usage.
- """
- embeddings = []
- embedding_used_tokens = 0
-
- def call_embedding_api(text):
- try:
- return dashscope.TextEmbedding.call(
- api_key=credentials_kwargs["dashscope_api_key"],
- model=model,
- input=text,
- text_type="document"
- )
- except Exception as e:
- # Return the exception to be handled by the caller
- return e
-
- for text in texts:
- # First attempt
- response = call_embedding_api(text)
-
- # Handle rate limit error (429)
- # Check if response is an exception with rate limit info
- if hasattr(response, 'status_code') and response.status_code == 429:
- print(f"Rate limit exceeded (429). Response: {response}")
- import time
- time.sleep(10)
- # Retry once after sleeping
- response = call_embedding_api(text)
-
- # Process response
- if hasattr(response, 'output') and response.output and "embeddings" in response.output and response.output["embeddings"]:
- data = response.output["embeddings"][0]
- if "embedding" in data:
- embeddings.append(data["embedding"])
- else:
- raise ValueError(f"Embedding data is missing in the response: {response}")
- else:
- raise ValueError(f"Response output is missing or does not contain embeddings: {response}")
-
- if hasattr(response, 'usage') and response.usage and "total_tokens" in response.usage:
- embedding_used_tokens += response.usage["total_tokens"]
- else:
- raise ValueError(f"Response usage is missing or does not contain total tokens: {response}")
-
- return ([list(map(float, e)) for e in embeddings], embedding_used_tokens)
-
- def _calc_response_usage(self, model: str, credentials: dict, tokens: int) -> EmbeddingUsage:
- """
- Calculate response usage
-
- :param model: model name
- :param tokens: input tokens
- :return: usage
- """
- input_price_info = self.get_price(
- model=model, credentials=credentials, price_type=PriceType.INPUT, tokens=tokens
- )
- usage = EmbeddingUsage(
- tokens=tokens,
- total_tokens=tokens,
- unit_price=input_price_info.unit_price,
- price_unit=input_price_info.unit,
- total_price=input_price_info.total_amount,
- currency=input_price_info.currency,
- latency=time.perf_counter() - self.started_at,
- )
- return usage
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/__init__.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts-1.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts-1.yaml
deleted file mode 100644
index 4eaa0ff361..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts-1.yaml
+++ /dev/null
@@ -1,139 +0,0 @@
-model: tts-1
-model_type: tts
-model_properties:
- default_voice: 'sambert-zhiru-v1'
- voices:
- - mode: "sambert-zhinan-v1"
- name: "知楠(广告男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiqi-v1"
- name: "知琪(温柔女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhichu-v1"
- name: "知厨(新闻播报)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhide-v1"
- name: "知德(新闻男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhijia-v1"
- name: "知佳(标准女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiru-v1"
- name: "知茹(新闻女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiqian-v1"
- name: "知倩(配音解说、新闻播报)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhixiang-v1"
- name: "知祥(配音解说)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiwei-v1"
- name: "知薇(萝莉女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhihao-v1"
- name: "知浩(咨询男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhijing-v1"
- name: "知婧(严厉女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiming-v1"
- name: "知茗(诙谐男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhimo-v1"
- name: "知墨(情感男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhina-v1"
- name: "知娜(浙普女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhishu-v1"
- name: "知树(资讯男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhistella-v1"
- name: "知莎(知性女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiting-v1"
- name: "知婷(电台女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhixiao-v1"
- name: "知笑(资讯女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiya-v1"
- name: "知雅(严厉女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiye-v1"
- name: "知晔(青年男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiying-v1"
- name: "知颖(软萌童声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhiyuan-v1"
- name: "知媛(知心姐姐)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhigui-v1"
- name: "知柜(直播女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhishuo-v1"
- name: "知硕(自然男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhimiao-emo-v1"
- name: "知妙(多种情感女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhimao-v1"
- name: "知猫(直播女声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhilun-v1"
- name: "知伦(悬疑解说)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhifei-v1"
- name: "知飞(激昂解说)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-zhida-v1"
- name: "知达(标准男声)"
- language: [ "zh-Hans", "en-US" ]
- - mode: "sambert-camila-v1"
- name: "Camila(西班牙语女声)"
- language: [ "es-ES" ]
- - mode: "sambert-perla-v1"
- name: "Perla(意大利语女声)"
- language: [ "it-IT" ]
- - mode: "sambert-indah-v1"
- name: "Indah(印尼语女声)"
- language: [ "id-ID" ]
- - mode: "sambert-clara-v1"
- name: "Clara(法语女声)"
- language: [ "fr-FR" ]
- - mode: "sambert-hanna-v1"
- name: "Hanna(德语女声)"
- language: [ "de-DE" ]
- - mode: "sambert-beth-v1"
- name: "Beth(咨询女声)"
- language: [ "en-US" ]
- - mode: "sambert-betty-v1"
- name: "Betty(客服女声)"
- language: [ "en-US" ]
- - mode: "sambert-cally-v1"
- name: "Cally(自然女声)"
- language: [ "en-US" ]
- - mode: "sambert-cindy-v1"
- name: "Cindy(对话女声)"
- language: [ "en-US" ]
- - mode: "sambert-eva-v1"
- name: "Eva(陪伴女声)"
- language: [ "en-US" ]
- - mode: "sambert-donna-v1"
- name: "Donna(教育女声)"
- language: [ "en-US" ]
- - mode: "sambert-brian-v1"
- name: "Brian(客服男声)"
- language: [ "en-US" ]
- - mode: "sambert-waan-v1"
- name: "Waan(泰语女声)"
- language: [ "th-TH" ]
- word_limit: 7000
- audio_type: 'mp3'
- max_workers: 5
-pricing:
- input: '1'
- output: '0'
- unit: '0.0001'
- currency: RMB
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts.py
deleted file mode 100644
index 78787ad62f..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/models/tts/tts.py
+++ /dev/null
@@ -1,146 +0,0 @@
-import threading
-from queue import Queue
-from typing import Any, Optional
-import dashscope
-from dashscope import SpeechSynthesizer
-from dashscope.api_entities.dashscope_response import SpeechSynthesisResponse
-from dashscope.audio.tts import ResultCallback, SpeechSynthesisResult
-from dify_plugin.errors.model import CredentialsValidateFailedError, InvokeBadRequestError
-from dify_plugin.interfaces.model.tts_model import TTSModel
-from models._common import _CommonTongyi
-
-
-class TongyiText2SpeechModel(_CommonTongyi, TTSModel):
- """
- Model class for Tongyi Speech to text model.
- """
-
- def _invoke(
- self, model: str, tenant_id: str, credentials: dict, content_text: str, voice: str, user: Optional[str] = None
- ) -> Any:
- """
- _invoke text2speech model
-
- :param model: model name
- :param tenant_id: user tenant id
- :param credentials: model credentials
- :param voice: model timbre
- :param content_text: text content to be translated
- :param user: unique user id
- :return: text translated to audio file
- """
- if not voice or voice not in [
- d["value"] for d in self.get_tts_model_voices(model=model, credentials=credentials)
- ]:
- voice = self._get_model_default_voice(model, credentials)
- return self._tts_invoke_streaming(model=model, credentials=credentials, content_text=content_text, voice=voice)
-
- def validate_credentials(self, model: str, credentials: dict, user: Optional[str] = None) -> None:
- """
- validate credentials text2speech model
-
- :param model: model name
- :param credentials: model credentials
- :param user: unique user id
- :return: text translated to audio file
- """
- try:
- self._tts_invoke_streaming(
- model=model,
- credentials=credentials,
- content_text="Hello Dify!",
- voice=self._get_model_default_voice(model, credentials),
- )
- except Exception as ex:
- raise CredentialsValidateFailedError(str(ex))
-
- def _tts_invoke_streaming(self, model: str, credentials: dict, content_text: str, voice: str) -> Any:
- """
- _tts_invoke_streaming text2speech model
-
- :param model: model name
- :param credentials: model credentials
- :param voice: model timbre
- :param content_text: text content to be translated
- :return: text translated to audio file
- """
- word_limit = self._get_model_word_limit(model, credentials)
- audio_type = self._get_model_audio_type(model, credentials)
- try:
- audio_queue: Queue = Queue()
- callback = Callback(queue=audio_queue)
-
- def invoke_remote(content, v, api_key, cb, at, wl):
- if len(content) < word_limit:
- sentences = [content]
- else:
- sentences = list(self._split_text_into_sentences(org_text=content, max_length=wl))
- for sentence in sentences:
- SpeechSynthesizer.call(
- model=v,
- sample_rate=16000,
- api_key=api_key,
- text=sentence.strip(),
- callback=cb,
- format=at,
- word_timestamp_enabled=True,
- phoneme_timestamp_enabled=True,
- )
-
- threading.Thread(
- target=invoke_remote,
- args=(content_text, voice, credentials.get("dashscope_api_key"), callback, audio_type, word_limit),
- ).start()
- while True:
- audio = audio_queue.get()
- if audio is None:
- break
- yield audio
- except Exception as ex:
- raise InvokeBadRequestError(str(ex))
-
- @staticmethod
- def _process_sentence(sentence: str, credentials: dict, voice: str, audio_type: str):
- """
- _tts_invoke Tongyi text2speech model api
-
- :param credentials: model credentials
- :param sentence: text content to be translated
- :param voice: model timbre
- :param audio_type: audio file type
- :return: text translated to audio file
- """
- response = dashscope.audio.tts.SpeechSynthesizer.call(
- model=voice,
- sample_rate=48000,
- api_key=credentials.get("dashscope_api_key"),
- text=sentence.strip(),
- format=audio_type,
- )
- if isinstance(response.get_audio_data(), bytes):
- return response.get_audio_data()
-
-
-class Callback(ResultCallback):
- def __init__(self, queue: Queue):
- self._queue = queue
-
- def on_open(self):
- pass
-
- def on_complete(self):
- self._queue.put(None)
- self._queue.task_done()
-
- def on_error(self, response: SpeechSynthesisResponse):
- self._queue.put(None)
- self._queue.task_done()
-
- def on_close(self):
- self._queue.put(None)
- self._queue.task_done()
-
- def on_event(self, result: SpeechSynthesisResult):
- ad = result.get_audio_frame()
- if ad:
- self._queue.put(ad)
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.py b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.py
deleted file mode 100644
index bb9df97fb7..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.py
+++ /dev/null
@@ -1,25 +0,0 @@
-import logging
-from dify_plugin.entities.model import ModelType
-from dify_plugin.errors.model import CredentialsValidateFailedError
-from dify_plugin import ModelProvider
-
-logger = logging.getLogger(__name__)
-
-
-class TongyiProvider(ModelProvider):
- def validate_provider_credentials(self, credentials: dict) -> None:
- """
- Validate provider credentials
-
- if validate failed, raise exception
-
- :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
- """
- try:
- model_instance = self.get_model_instance(ModelType.LLM)
- model_instance.validate_credentials(model="qwen-turbo", credentials=credentials)
- except CredentialsValidateFailedError as ex:
- raise ex
- except Exception as ex:
- logger.exception(f"{self.get_provider_schema().provider} credentials validate failed")
- raise ex
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.yaml b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.yaml
deleted file mode 100644
index 2c925c02b6..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/provider/tongyi.yaml
+++ /dev/null
@@ -1,111 +0,0 @@
-background: '#EFF1FE'
-configurate_methods:
-- predefined-model
-- customizable-model
-extra:
- python:
- model_sources:
- - models/llm/llm.py
- - models/rerank/rerank.py
- - models/text_embedding/text_embedding.py
- - models/tts/tts.py
- provider_source: provider/tongyi.py
-help:
- title:
- en_US: Get your API key from AliCloud
- zh_Hans: 从阿里云百炼获取 API Key
- url:
- en_US: https://bailian.console.aliyun.com/?apiKey=1#/api-key
-icon_large:
- en_US: icon_l_en.png
- zh_Hans: icon_l_zh.png
-icon_small:
- en_US: icon_s_en.png
-label:
- en_US: TONGYI
- zh_Hans: 通义千问
-model_credential_schema:
- credential_form_schemas:
- - label:
- en_US: API Key
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 在此输入您的 API Key
- required: true
- type: secret-input
- variable: dashscope_api_key
- - default: '4096'
- label:
- en_US: Model context size
- zh_Hans: 模型上下文长度
- placeholder:
- en_US: Enter your Model context size
- zh_Hans: 在此输入您的模型上下文长度
- required: true
- type: text-input
- variable: context_size
- - default: '4096'
- label:
- en_US: Upper bound for max tokens
- zh_Hans: 最大 token 上限
- show_on:
- - value: llm
- variable: __model_type
- type: text-input
- variable: max_tokens
- - default: no_call
- label:
- en_US: Function calling
- options:
- - label:
- en_US: Not Support
- zh_Hans: 不支持
- value: no_call
- - label:
- en_US: Support
- zh_Hans: 支持
- value: function_call
- required: false
- show_on:
- - value: llm
- variable: __model_type
- type: select
- variable: function_calling_type
- model:
- label:
- en_US: Model Name
- zh_Hans: 模型名称
- placeholder:
- en_US: Enter your model name
- zh_Hans: 输入模型名称
-models:
- llm:
- position: models/llm/_position.yaml
- predefined:
- - models/llm/*.yaml
- rerank:
- position: models/rerank/_position.yaml
- predefined:
- - models/rerank/*.yaml
- text_embedding:
- predefined:
- - models/text_embedding/*.yaml
- tts:
- predefined:
- - models/tts/*.yaml
-provider: tongyi
-provider_credential_schema:
- credential_form_schemas:
- - label:
- en_US: API Key
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 在此输入您的 API Key
- required: true
- type: secret-input
- variable: dashscope_api_key
-supported_model_types:
-- llm
-- tts
-- text-embedding
-- rerank
diff --git a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/requirements.txt b/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/requirements.txt
deleted file mode 100644
index 07a3a40cd5..0000000000
--- a/api/init_data/plugins/storage/cwd/langgenius/tongyi-0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb/requirements.txt
+++ /dev/null
@@ -1,4 +0,0 @@
-dify_plugin==0.0.1b73
-numpy~=2.2.3
-dashscope~=1.22.2
-openai~=1.65.4
diff --git a/api/init_data/plugins/storage/plugin/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9 b/api/init_data/plugins/storage/plugin/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9
deleted file mode 100644
index eb7ac5f66e..0000000000
Binary files a/api/init_data/plugins/storage/plugin/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403 b/api/init_data/plugins/storage/plugin/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403
deleted file mode 100644
index cbcbc0b37d..0000000000
Binary files a/api/init_data/plugins/storage/plugin/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7 b/api/init_data/plugins/storage/plugin/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7
deleted file mode 100644
index 4a6554f134..0000000000
Binary files a/api/init_data/plugins/storage/plugin/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3 b/api/init_data/plugins/storage/plugin/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3
deleted file mode 100644
index 4a5441cd85..0000000000
Binary files a/api/init_data/plugins/storage/plugin/langgenius/siliconflow0.0.8@217f973bd7ced1b099c2f0c669f1356bdf4cc38b8372fd58d7874f9940b95de3 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9 b/api/init_data/plugins/storage/plugin_packages/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9
deleted file mode 100644
index eb7ac5f66e..0000000000
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/agent0.0.11@6b60e6812d1428f06a4dee70a1e9c7dd2af217bf123103758fb40483069c12c9 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403 b/api/init_data/plugins/storage/plugin_packages/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403
deleted file mode 100644
index cbcbc0b37d..0000000000
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/deepseek0.0.5@fd6efd37c2a931911de8ab9ca3ba2da303bef146d45ee87ad896b04b36d09403 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7 b/api/init_data/plugins/storage/plugin_packages/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7
deleted file mode 100644
index 4a6554f134..0000000000
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/ollama0.0.3@9ded90ac00e8510119a24be7396ba77191c9610d5e1e29f59d68fa1229822fc7 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7 b/api/init_data/plugins/storage/plugin_packages/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7
deleted file mode 100644
index 151db5c4a6..0000000000
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/openai_api_compatible0.0.11@410445eba2fa0f693d26dea2c3b9ffe51ad0777e021146ff877af6098412efc7 and /dev/null differ
diff --git a/api/init_data/plugins/storage/plugin_packages/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb b/api/init_data/plugins/storage/plugin_packages/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb
deleted file mode 100644
index 8532a7140e..0000000000
Binary files a/api/init_data/plugins/storage/plugin_packages/langgenius/tongyi0.0.14@d333909fe8d75a335b44da4b878d5120779b8703f12c21cf4730135d6864afbb and /dev/null differ
diff --git a/api/init_data/workflows/en/Container CPU usage analysis.yml b/api/init_data/workflows/en/Container CPU usage analysis.yml
index 46c7f21426..22f99dab39 100644
--- a/api/init_data/workflows/en/Container CPU usage analysis.yml
+++ b/api/init_data/workflows/en/Container CPU usage analysis.yml
@@ -147,7 +147,7 @@ workflow:
- data:
desc: ''
selected: true
- title: 开始
+ title: start
type: start
variables:
- label: Container runtime type(containered or docker)
@@ -340,7 +340,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
+ title: Container CPU Usage
tool_configurations: {}
tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
@@ -513,7 +513,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
+ title: Container CPU usage
tool_configurations: {}
tool_label: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
tool_name: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
@@ -566,7 +566,7 @@ workflow:
logical_operator: and
desc: ''
selected: false
- title: 条件分支
+ title: if-else
type: if-else
height: 125
id: '1742544615331'
@@ -585,7 +585,7 @@ workflow:
desc: ''
output_type: string
selected: false
- title: 变量聚合器
+ title: summary
type: variable-aggregator
variables:
- - '1742544602116'
@@ -613,7 +613,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1742545032360'
diff --git a/api/init_data/workflows/en/Container memory analysis.yml b/api/init_data/workflows/en/Container memory analysis.yml
index 2bf24d679b..91c55af2fb 100644
--- a/api/init_data/workflows/en/Container memory analysis.yml
+++ b/api/init_data/workflows/en/Container memory analysis.yml
@@ -142,7 +142,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: pod
@@ -259,7 +259,7 @@ workflow:
- text
variable: text
selected: true
- title: 结束
+ title: end
type: end
height: 89
id: '1741075309105'
@@ -409,7 +409,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
+ title: Container memory usage
tool_configurations: {}
tool_label: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
@@ -582,7 +582,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器内存使用字节数(使用Docker容器运行时,按Pod统计)
+ title: Container memory usage
tool_configurations: {}
tool_label: 容器内存使用字节数(使用Docker容器运行时,按Pod统计)
tool_name: 容器内存使用字节数(使用Docker容器运行时,按Pod统计)
@@ -635,7 +635,7 @@ workflow:
logical_operator: and
desc: ''
selected: false
- title: 条件分支
+ title: if-else
type: if-else
height: 125
id: '1742545677987'
@@ -654,7 +654,7 @@ workflow:
desc: ''
output_type: string
selected: false
- title: 变量聚合器
+ title: summary
type: variable-aggregator
variables:
- - '1742545659582'
diff --git a/api/init_data/workflows/en/Host CPU IO Wait.yml b/api/init_data/workflows/en/Host CPU IO Wait.yml
index cad3cd436a..adf48397fa 100644
--- a/api/init_data/workflows/en/Host CPU IO Wait.yml
+++ b/api/init_data/workflows/en/Host CPU IO Wait.yml
@@ -97,7 +97,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Query start time(Microsecond)
@@ -216,7 +216,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机IO等待CPU繁忙率
+ title: Query Host IO Wait
tool_configurations: {}
tool_label: 宿主机IO等待CPU繁忙率
tool_name: host_cpu_iowait
@@ -307,7 +307,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1742548523246'
diff --git a/api/init_data/workflows/en/Host CPU usage analysis.yml b/api/init_data/workflows/en/Host CPU usage analysis.yml
index f87ef0632e..fe6dba16ae 100644
--- a/api/init_data/workflows/en/Host CPU usage analysis.yml
+++ b/api/init_data/workflows/en/Host CPU usage analysis.yml
@@ -167,7 +167,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Node name
@@ -221,7 +221,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1740015067036'
@@ -398,7 +398,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 查询宿主机CPU压力
+ title: Query Host CPU Usage
tool_configurations: {}
tool_label: 查询宿主机CPU压力
tool_name: 查询宿主机CPU压力
@@ -448,7 +448,7 @@ workflow:
logical_operator: and
desc: ''
selected: false
- title: 条件分支
+ title: if-else
type: if-else
height: 125
id: '1742549684668'
@@ -598,7 +598,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
+ title: Container CPU usage
tool_configurations: {}
tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
@@ -768,7 +768,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
+ title: Container CPU usage
tool_configurations: {}
tool_label: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
tool_name: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
@@ -801,7 +801,7 @@ workflow:
desc: ''
output_type: string
selected: false
- title: 变量聚合器
+ title: summary
type: variable-aggregator
variables:
- - '1742549705555'
diff --git a/api/init_data/workflows/en/Host disk usage.yml b/api/init_data/workflows/en/Host disk usage.yml
index 8014d776d8..2407c89a41 100644
--- a/api/init_data/workflows/en/Host disk usage.yml
+++ b/api/init_data/workflows/en/Host disk usage.yml
@@ -97,7 +97,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Node name
@@ -216,7 +216,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机磁盘使用率(百分比,不含rootfs)
+ title: Host disk usage
tool_configurations: {}
tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
@@ -306,7 +306,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1742549028365'
diff --git a/api/init_data/workflows/en/Host memory analysis.yml b/api/init_data/workflows/en/Host memory analysis.yml
index a36cda4a9a..113632068a 100644
--- a/api/init_data/workflows/en/Host memory analysis.yml
+++ b/api/init_data/workflows/en/Host memory analysis.yml
@@ -119,7 +119,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Query start time(Microsecond)
@@ -275,7 +275,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 查询宿主机RAM使用率
+ title: Query Host RAM Usage
tool_configurations: {}
tool_label: 查询宿主机RAM使用率
tool_name: 查询宿主机RAM使用率
@@ -420,7 +420,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 查询宿主机RAM总大小
+ title: Query Host RAM Total Size
tool_configurations: {}
tool_label: 查询宿主机RAM总大小
tool_name: 查询宿主机RAM总大小
@@ -513,7 +513,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1742546671231'
diff --git a/api/init_data/workflows/en/Log analysis.yml b/api/init_data/workflows/en/Log analysis.yml
index 3dd96ed973..6970135224 100644
--- a/api/init_data/workflows/en/Log analysis.yml
+++ b/api/init_data/workflows/en/Log analysis.yml
@@ -97,7 +97,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Service Name
@@ -118,7 +118,7 @@ workflow:
required: true
type: number
variable: endTime
- height: 141
+ height: 142
id: '1740548057126'
position:
x: 80
@@ -130,7 +130,7 @@ workflow:
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
outputs:
@@ -139,9 +139,9 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
- height: 89
+ height: 90
id: '1740550714241'
position:
x: 988
@@ -153,7 +153,7 @@ workflow:
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
context:
enabled: false
@@ -174,13 +174,13 @@ workflow:
role: user
text: Here are the logs from the specified time period {{#1741576642510.text#}}.
Please help summarize the exception occurrences in the logs.
- selected: true
+ selected: false
title: LLM
type: llm
variables: []
vision:
enabled: false
- height: 89
+ height: 90
id: '1740647123944'
position:
x: 687.0472902605677
@@ -188,11 +188,11 @@ workflow:
positionAbsolute:
x: 687.0472902605677
y: 282
- selected: true
+ selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -277,8 +277,8 @@ workflow:
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
- selected: false
- title: 查询服务日志数据
+ selected: true
+ title: query service log
tool_configurations: {}
tool_label: 查询服务日志数据
tool_name: 查询服务日志数据
@@ -297,7 +297,7 @@ workflow:
- '1740548057126'
- startTime
type: tool
- height: 53
+ height: 54
id: '1741576642510'
position:
x: 384
@@ -305,12 +305,12 @@ workflow:
positionAbsolute:
x: 384
y: 282
- selected: false
+ selected: true
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
viewport:
- x: -336.5210134696184
- y: -51.41093641424487
- zoom: 0.9137626364719462
+ x: 175.96621796218471
+ y: 168.67603979204648
+ zoom: 0.5074056864830986
diff --git a/api/init_data/workflows/en/Network anomalies analysis.yml b/api/init_data/workflows/en/Network anomalies analysis.yml
index a33b1d8fa9..13e1126cf6 100644
--- a/api/init_data/workflows/en/Network anomalies analysis.yml
+++ b/api/init_data/workflows/en/Network anomalies analysis.yml
@@ -98,7 +98,7 @@ workflow:
- data:
desc: ''
selected: true
- title: 开始
+ title: start
type: start
variables:
- label: Pod
@@ -204,7 +204,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1741075309105'
@@ -329,7 +329,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ title: Container Network RTT
tool_configurations: {}
tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
tool_name: 查询容器网络与下游RTT
diff --git a/api/init_data/workflows/en/Service alert event.yml b/api/init_data/workflows/en/Service alert event.yml
index 0ef1519626..36c42050f9 100644
--- a/api/init_data/workflows/en/Service alert event.yml
+++ b/api/init_data/workflows/en/Service alert event.yml
@@ -97,7 +97,7 @@ workflow:
- data:
desc: ''
selected: false
- title: 开始
+ title: start
type: start
variables:
- label: Query start time(Microsecond)
@@ -196,7 +196,7 @@ workflow:
- text
variable: text
selected: false
- title: 结束
+ title: end
type: end
height: 89
id: '1741075309105'
@@ -321,7 +321,7 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 查询入口服务告警事件
+ title: query entry service alert events
tool_configurations: {}
tool_label: 查询入口服务告警事件
tool_name: alert
diff --git a/api/init_data/workflows/en/alert validity confirmation.yml b/api/init_data/workflows/en/alert validity confirmation.yml
index 28cb78d449..bdb6672430 100644
--- a/api/init_data/workflows/en/alert validity confirmation.yml
+++ b/api/init_data/workflows/en/alert validity confirmation.yml
@@ -60,42 +60,6 @@ workflow:
voice: ''
graph:
edges:
- - data:
- isInIteration: false
- sourceType: code
- targetType: question-classifier
- id: 1741161440242-source-1741158559444-target
- selected: false
- source: '1741161440242'
- sourceHandle: source
- target: '1741158559444'
- targetHandle: target
- type: custom
- zIndex: 0
- - data:
- isInIteration: false
- sourceType: variable-aggregator
- targetType: tool
- id: 1741162531836-source-1741166377433-target
- selected: false
- source: '1741162531836'
- sourceHandle: source
- target: '1741166377433'
- targetHandle: target
- type: custom
- zIndex: 0
- - data:
- isInIteration: false
- sourceType: start
- targetType: code
- id: 1741157526222-source-1741161440242-target
- selected: false
- source: '1741157526222'
- sourceHandle: source
- target: '1741161440242'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: agent
@@ -144,18 +108,6 @@ workflow:
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: tool
- targetType: variable-aggregator
- id: 1741166377433-source-1741311394752-target
- selected: false
- source: '1741166377433'
- sourceHandle: source
- target: '1741311394752'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
@@ -180,18 +132,6 @@ workflow:
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741158765960-1741328058981-target
- selected: false
- source: '1741158559444'
- sourceHandle: '1741158765960'
- target: '1741328058981'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
@@ -204,18 +144,6 @@ workflow:
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741318899444-1741328169934-target
- selected: false
- source: '1741158559444'
- sourceHandle: '1741318899444'
- target: '1741328169934'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
@@ -276,18 +204,6 @@ workflow:
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741319171199-1741328692906-target
- selected: false
- source: '1741158559444'
- sourceHandle: '1741319171199'
- target: '1741328692906'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
@@ -338,13 +254,59 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: tool
+ sourceType: llm
+ targetType: question-classifier
+ id: 1742366141890-source-1742366303110-target
+ selected: false
+ source: '1742366141890'
+ sourceHandle: source
+ target: '1742366303110'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
targetType: variable-aggregator
- id: 1741328045214-source-1741162531836-target
+ id: 1742366303110-1-1741311394752-target
selected: false
+ source: '1742366303110'
+ sourceHandle: '1'
+ target: '1741311394752'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: variable-aggregator
+ id: 1742366303110-2-1741311394752-target
+ selected: false
+ source: '1742366303110'
+ sourceHandle: '2'
+ target: '1741311394752'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: code
+ targetType: question-classifier
+ id: 1742433446760-source-1741158559444-target
+ source: '1742433446760'
+ sourceHandle: source
+ target: '1741158559444'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328045214-source-17424339242280-target
source: '1741328045214'
sourceHandle: source
- target: '1741162531836'
+ target: '17424339242280'
targetHandle: target
type: custom
zIndex: 0
@@ -352,9 +314,8 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328058981-source-1741162531836-target
- selected: false
- source: '1741328058981'
+ id: 17424339242280-source-1741162531836-target
+ source: '17424339242280'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -362,13 +323,23 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: tool
+ sourceType: variable-aggregator
targetType: variable-aggregator
- id: 1741328076453-source-1741162531836-target
- selected: false
- source: '1741328076453'
+ id: 1741162531836-source-1742434016239-target
+ source: '1741162531836'
sourceHandle: source
- target: '1741162531836'
+ target: '1742434016239'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: variable-aggregator
+ targetType: llm
+ id: 1742434016239-source-1742366141890-target
+ source: '1742434016239'
+ sourceHandle: source
+ target: '1742366141890'
targetHandle: target
type: custom
zIndex: 0
@@ -376,9 +347,8 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328169934-source-1741162531836-target
- selected: false
- source: '1741328169934'
+ id: 17424342365860-source-1741162531836-target
+ source: '17424342365860'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -387,12 +357,22 @@ workflow:
- data:
isInIteration: false
sourceType: tool
- targetType: variable-aggregator
- id: 1741329632798-source-1741162531836-target
- selected: false
+ targetType: tool
+ id: 1741328076453-source-17424342365860-target
+ source: '1741328076453'
+ sourceHandle: source
+ target: '17424342365860'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741329632798-source-17424344697090-target
source: '1741329632798'
sourceHandle: source
- target: '1741162531836'
+ target: '17424344697090'
targetHandle: target
type: custom
zIndex: 0
@@ -400,69 +380,118 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328197695-source-1741162531836-target
- selected: false
- source: '1741328197695'
+ id: 17424344697090-source-1741162531836-target
+ source: '17424344697090'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328197695-source-17424345080000-target
+ source: '1741328197695'
+ sourceHandle: source
+ target: '17424345080000'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328213545-source-1741162531836-target
- selected: false
- source: '1741328213545'
+ id: 17424345080000-source-1741162531836-target
+ source: '17424345080000'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328213545-source-17424345315500-target
+ source: '1741328213545'
+ sourceHandle: source
+ target: '17424345315500'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328346220-source-1741162531836-target
- selected: false
- source: '1741328346220'
+ id: 17424345315500-source-1741162531836-target
+ source: '17424345315500'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328346220-source-17424345826170-target
+ source: '1741328346220'
+ sourceHandle: source
+ target: '17424345826170'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328423453-source-1741162531836-target
- selected: false
- source: '1741328423453'
+ id: 17424345826170-source-1741162531836-target
+ source: '17424345826170'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328423453-source-17424346884650-target
+ source: '1741328423453'
+ sourceHandle: source
+ target: '17424346884650'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328466394-source-1741162531836-target
- selected: false
- source: '1741328466394'
+ id: 17424346884650-source-1741162531836-target
+ source: '17424346884650'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328466394-source-17424347242840-target
+ source: '1741328466394'
+ sourceHandle: source
+ target: '17424347242840'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328692906-source-1741162531836-target
- selected: false
- source: '1741328692906'
+ id: 17424347242840-source-1741162531836-target
+ source: '17424347242840'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -471,12 +500,11 @@ workflow:
- data:
isInIteration: false
sourceType: tool
- targetType: variable-aggregator
- id: 1741328742817-source-1741162531836-target
- selected: false
+ targetType: tool
+ id: 1741328742817-source-17424348206030-target
source: '1741328742817'
sourceHandle: source
- target: '1741162531836'
+ target: '17424348206030'
targetHandle: target
type: custom
zIndex: 0
@@ -484,21 +512,30 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328773213-source-1741162531836-target
- selected: false
- source: '1741328773213'
+ id: 17424348206030-source-1741162531836-target
+ source: '17424348206030'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328773213-source-17424348526540-target
+ source: '1741328773213'
+ sourceHandle: source
+ target: '17424348526540'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328799030-source-1741162531836-target
- selected: false
- source: '1741328799030'
+ id: 17424348526540-source-1741162531836-target
+ source: '17424348526540'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -506,13 +543,12 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: question-classifier
+ sourceType: tool
targetType: tool
- id: 1741158559444-1741591414269-1741591590829-target
- selected: false
- source: '1741158559444'
- sourceHandle: '1741591414269'
- target: '1741591590829'
+ id: 1741328799030-source-17424348570980-target
+ source: '1741328799030'
+ sourceHandle: source
+ target: '17424348570980'
targetHandle: target
type: custom
zIndex: 0
@@ -520,77 +556,230 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741591590829-source-1741162531836-target
- selected: false
- source: '1741591590829'
+ id: 17424348570980-source-1741162531836-target
+ source: '17424348570980'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
- nodes:
- data:
- desc: ''
- selected: true
- title: start
- type: start
- variables:
- - allowed_file_extensions: []
- allowed_file_types:
- - document
- allowed_file_upload_methods:
- - local_file
- - remote_url
- label: alert
- max_length: 256
- options: []
- required: true
- type: text-input
- variable: alert
- - label: params
- max_length: 99999999999
- options: []
- required: true
- type: paragraph
- variable: params
- - label: startTime(Microsecond)
- max_length: 48
- options: []
- required: true
- type: number
- variable: startTime
- - label: endTime(Microsecond)
- max_length: 48
- options: []
- required: true
- type: number
- variable: endTime
- - allowed_file_extensions:
- - .json
- allowed_file_types:
- - custom
- allowed_file_upload_methods:
- - local_file
- - remote_url
+ isInIteration: false
+ sourceType: start
+ targetType: code
+ id: 1741157526222-source-1742806924635-target
+ source: '1741157526222'
+ sourceHandle: source
+ target: '1742806924635'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: code
+ targetType: code
+ id: 1742806924635-source-1742433446760-target
+ source: '1742806924635'
+ sourceHandle: source
+ target: '1742433446760'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741158765960-1742979394268-target
+ source: '1741158559444'
+ sourceHandle: '1741158765960'
+ target: '1742979394268'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741318899444-1742979595004-target
+ source: '1741158559444'
+ sourceHandle: '1741318899444'
+ target: '1742979595004'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741591414269-17429797453350-target
+ source: '1741158559444'
+ sourceHandle: '1741591414269'
+ target: '17429797453350'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 17429797453350-source-17429797664440-target
+ source: '17429797453350'
+ sourceHandle: source
+ target: '17429797664440'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429797664440-source-1741162531836-target
+ source: '17429797664440'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741319171199-1742979828391-target
+ source: '1741158559444'
+ sourceHandle: '1741319171199'
+ target: '1742979828391'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979828391-source-17429798797920-target
+ source: '1742979828391'
+ sourceHandle: source
+ target: '17429798797920'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429798797920-source-1741162531836-target
+ source: '17429798797920'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979394268-source-17429835599060-target
+ source: '1742979394268'
+ sourceHandle: source
+ target: '17429835599060'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429835599060-source-1741162531836-target
+ source: '17429835599060'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979595004-source-17429835940550-target
+ source: '1742979595004'
+ sourceHandle: source
+ target: '17429835940550'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429835940550-source-1741162531836-target
+ source: '17429835940550'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ nodes:
+ - data:
+ desc: ''
+ selected: false
+ title: Start
+ type: start
+ variables:
+ - allowed_file_extensions: []
+ allowed_file_types:
+ - document
+ allowed_file_upload_methods:
+ - local_file
+ - remote_url
+ label: alert
+ max_length: 256
+ options: []
+ required: true
+ type: text-input
+ variable: alert
+ - label: params
+ max_length: 99999999999
+ options: []
+ required: true
+ type: paragraph
+ variable: params
+ - label: startTime
+ max_length: 48
+ options: []
+ required: true
+ type: number
+ variable: startTime
+ - label: endTime
+ max_length: 48
+ options: []
+ required: true
+ type: number
+ variable: endTime
+ - allowed_file_extensions:
+ - .json
+ allowed_file_types:
+ - custom
+ allowed_file_upload_methods:
+ - local_file
+ - remote_url
label: input
max_length: 48
options: []
required: false
type: file
variable: input
- height: 193
+ height: 194
id: '1741157526222'
position:
- x: -474.8546859399444
- y: 113.39535872618072
+ x: 30
+ y: 560
positionAbsolute:
- x: -474.8546859399444
- y: 113.39535872618072
- selected: true
+ x: 30
+ y: 560
+ selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
outputs:
@@ -599,21 +788,21 @@ workflow:
- output
variable: text
selected: false
- title: End
+ title: end
type: end
- height: 89
+ height: 90
id: '1741157560922'
position:
- x: 3744.206346600103
- y: 363.73374031791394
+ x: 3374
+ y: 560
positionAbsolute:
- x: 3744.206346600103
- y: 363.73374031791394
+ x: 3374
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
classes:
- id: '1'
@@ -631,15 +820,20 @@ workflow:
- id: '1741318899444'
name: 'Container related
+
Container memory usage exceeds 80%'
- id: '1741318983134'
name: 'Application metrics
- Error rate increased'
+ Error rate related
+
+ For example, Request error rate exceeds 0%, log error number related'
- id: '1741319019432'
name: 'Network related
- Network RTT delay exceeds 50ms'
+ If the network RTT delay exceeds 50ms
+
+ network rtt'
- id: '1741319060092'
name: 'Host related
@@ -673,48 +867,48 @@ workflow:
File descriptor usage exceeds 85%'
- id: '1741319394268'
- name: Unknown Type
+ name: unknow type
- id: '1741591414269'
name: 'Container type
Container is killed'
desc: ''
- instruction: Please classifiy the type of alarm event from the alarm event
- description
+ instruction: Please classify the alert events based on the alert event description
instructions: ''
model:
completion_params:
temperature: 0.7
mode: chat
- name: deepseek-v3
- provider: langgenius/openai_api_compatible/openai_api_compatible
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
query_variable_selector:
- '1741157526222'
- alert
selected: false
- title: Question Classifier
+ title: alert event classify
topics: []
type: question-classifier
vision:
enabled: false
- height: 885
+ height: 896
id: '1741158559444'
position:
- x: 457.0185062880778
- y: 139.09402013442167
+ x: 942
+ y: 560
positionAbsolute:
- x: 457.0185062880778
- y: 139.09402013442167
- selected: false
+ x: 942
+ y: 560
+ selected: true
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
agent_parameters:
instruction:
type: constant
- value: 根据告警事件的描述,选择工具查询数据,返回工具查询内容
+ value: According to the description of the alert event, select the tool
+ to query data and return the tool query content
model:
type: constant
value:
@@ -726,19 +920,19 @@ workflow:
type: model-selector
query:
type: constant
- value: '# alert info
+ value: '# Alert description
{{#1741157526222.alert#}}
- # data params
+ # Data parameters
{{#1741157526222.params#}}
- # startTime
+ # Start time
{{#1741157526222.startTime#}}
- # endTime
+ # End time
{{#1741157526222.endTime#}}
@@ -751,6 +945,9 @@ workflow:
extra:
description: ''
parameters:
+ cadvisor_job_name:
+ auto: 1
+ value: null
endTime:
auto: 1
value: null
@@ -769,23 +966,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: pod
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -793,23 +990,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -817,16 +1014,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -841,16 +1062,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -862,17 +1083,24 @@ workflow:
template: null
type: number
settings: {}
- tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器CPU利用率
+ tool_label: Container CPU throttling time (Docker runtime, aggregated
+ by Pod)
+ tool_name: 容器CPU节流时长(使用Docker容器运行时,按Pod统计)
type: builtin
- enabled: true
extra:
description: ''
parameters:
+ cadvisor_job_name:
+ auto: 1
+ value: null
endTime:
auto: 1
value: null
- node:
+ namespace:
+ auto: 1
+ value: null
+ pod:
auto: 1
value: null
startTime:
@@ -884,23 +1112,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -908,16 +1136,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -932,16 +1208,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -953,20 +1229,24 @@ workflow:
template: null
type: number
settings: {}
- tool_label: 宿主机IO等待CPU繁忙率
- tool_name: host_cpu_iowait
+ tool_label: Container CPU usage rate (Docker runtime, aggregated by
+ Pod)
+ tool_name: 容器CPU使用率(使用Docker容器运行时,按Pod统计)
type: builtin
- enabled: true
extra:
description: ''
parameters:
+ cadvisor_job_name:
+ auto: 1
+ value: null
endTime:
auto: 1
value: null
- job:
+ namespace:
auto: 1
value: null
- node:
+ pod:
auto: 1
value: null
startTime:
@@ -978,19 +1258,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Prometheus job name for host metrics
- ja_JP: Prometheus job name for host metrics
- pt_BR: Prometheus job name for host metrics
- zh_Hans: Prometheus任务名称(宿主机指标)
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: Prometheus Job
- ja_JP: Prometheus Job
- pt_BR: Tarefa Prometheus
- zh_Hans: Prometheus任务
- llm_description: Unique identifier for metrics scrape job
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: job
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
@@ -1002,23 +1282,47 @@ workflow:
default: null
form: llm
human_description:
- en_US: Host node identifier
- ja_JP: Host node identifier
- pt_BR: Host node identifier
- zh_Hans: 宿主机节点标识
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: Host Node
- ja_JP: Host Node
- pt_BR: Host Node
- zh_Hans: 宿主机节点
- llm_description: Unique identifier for host node
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
- name: node
+ name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
scope: null
template: null
type: string
@@ -1026,8 +1330,8 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
pt_BR: Data query start time
zh_Hans: 开始时间 (微秒)
label:
@@ -1035,7 +1339,7 @@ workflow:
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -1050,16 +1354,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -1071,870 +1375,2096 @@ workflow:
template: null
type: number
settings: {}
- tool_label: 查询宿主机最近1分钟的系统负载
- tool_name: 查询宿主机最近1分钟的系统负载
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
- label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 宿主机磁盘读取数据速率(字节/秒)
- tool_name: 宿主机磁盘读取数据速率(字节/秒)
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- content_key:
- auto: 1
- value: null
- endTime:
- auto: 1
- value: null
- service_name:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified service name
- ja_JP: Specified service name
- pt_BR: Specified service name
- zh_Hans: 指定的服务名
- label:
- en_US: service_name
- ja_JP: service_name
- pt_BR: service_name
- zh_Hans: service_name
- llm_description: 指定的服务名
- max: null
- min: null
- name: service_name
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified endpoint name
- ja_JP: Specified endpoint name
- pt_BR: Specified endpoint name
- zh_Hans: 指定的服务端点名
- label:
- en_US: content_key
- ja_JP: content_key
- pt_BR: content_key
- zh_Hans: content_key
- llm_description: 指定的服务端点名
- max: null
- min: null
- name: content_key
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
- tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- job:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Prometheus job name for host metrics
- ja_JP: Prometheus job name for host metrics
- pt_BR: Prometheus job name for host metrics
- zh_Hans: Prometheus任务名称(宿主机指标)
- label:
- en_US: Prometheus Job
- ja_JP: Prometheus Job
- pt_BR: Tarefa Prometheus
- zh_Hans: Prometheus任务
- llm_description: Unique identifier for metrics scrape job
- max: null
- min: null
- name: job
- options: []
- placeholder: null
- precision: null
- required: false
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Host node identifier
- ja_JP: Host node identifier
- pt_BR: Host node identifier
- zh_Hans: 宿主机节点标识
- label:
- en_US: Host Node
- ja_JP: Host Node
- pt_BR: Host Node
- zh_Hans: 宿主机节点
- llm_description: Unique identifier for host node
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 查询宿主机RAM总大小
- tool_name: 查询宿主机RAM总大小
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- job:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Prometheus job name for host metrics
- ja_JP: Prometheus job name for host metrics
- pt_BR: Prometheus job name for host metrics
- zh_Hans: Prometheus任务名称(宿主机指标)
- label:
- en_US: Prometheus Job
- ja_JP: Prometheus Job
- pt_BR: Tarefa Prometheus
- zh_Hans: Prometheus任务
- llm_description: Unique identifier for metrics scrape job
- max: null
- min: null
- name: job
- options: []
- placeholder: null
- precision: null
- required: false
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Host node identifier
- ja_JP: Host node identifier
- pt_BR: Host node identifier
- zh_Hans: 宿主机节点标识
- label:
- en_US: Host Node
- ja_JP: Host Node
- pt_BR: Host Node
- zh_Hans: 宿主机节点
- llm_description: Unique identifier for host node
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 查询宿主机根文件系统使用率
- tool_name: 查询宿主机根文件系统使用率
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
- label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 宿主机CPU繁忙率(百分比)
- tool_name: 查询主机CPU利用率
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
- label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 宿主机磁盘IO耗时速率
- tool_name: 宿主机磁盘IO耗时速率
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- job:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Prometheus job name for host metrics
- ja_JP: Prometheus job name for host metrics
- pt_BR: Prometheus job name for host metrics
- zh_Hans: Prometheus任务名称(宿主机指标)
- label:
- en_US: Prometheus Job
- ja_JP: Prometheus Job
- pt_BR: Tarefa Prometheus
- zh_Hans: Prometheus任务
- llm_description: Unique identifier for metrics scrape job
- max: null
- min: null
- name: job
- options: []
- placeholder: null
- precision: null
- required: false
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Host node identifier
- ja_JP: Host node identifier
- pt_BR: Host node identifier
- zh_Hans: 宿主机节点标识
- label:
- en_US: Host Node
- ja_JP: Host Node
- pt_BR: Host Node
- zh_Hans: 宿主机节点
- llm_description: Unique identifier for host node
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 查询宿主机CPU压力
- tool_name: 查询宿主机CPU压力
+ tool_label: Container network receive bandwidth (aggregated by namespace
+ and Pod)
+ tool_name: 容器网络接收带宽(按命名空间和Pod统计)
type: builtin
agent_strategy_label: FunctionCalling
agent_strategy_name: function_calling
agent_strategy_provider_name: langgenius/agent/agent
desc: ''
- output_schema: null
- plugin_unique_identifier: langgenius/agent:0.0.9@f16916b704a20067317dbe9030f62aa28f0832021a3ef6d4ce699504074c5e13
+ output_schema: null
+ plugin_unique_identifier: langgenius/agent:0.0.9@f16916b704a20067317dbe9030f62aa28f0832021a3ef6d4ce699504074c5e13
+ selected: false
+ title: Agent
+ type: agent
+ height: 198
+ id: '1741159085487'
+ position:
+ x: 2158
+ y: 560
+ positionAbsolute:
+ x: 2158
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ output_type: string
+ selected: false
+ title: summary 15 mins data
+ type: variable-aggregator
+ variables:
+ - - '1741328045214'
+ - text
+ - - '1742979394268'
+ - text
+ - - '1741328076453'
+ - text
+ - - '1742979595004'
+ - text
+ - - '1741329632798'
+ - text
+ - - '1741328197695'
+ - text
+ - - '1741328423453'
+ - text
+ - - '1741328466394'
+ - text
+ - - '1742979828391'
+ - text
+ - - '1741328742817'
+ - text
+ - - '1741328773213'
+ - text
+ - - '1741328799030'
+ - text
+ - - '17429797453350'
+ - text
+ - - '1741328346220'
+ - text
+ - - '1741328213545'
+ - text
+ height: 416
+ id: '1741162531836'
+ position:
+ x: 1854
+ y: 1275
+ positionAbsolute:
+ x: 1854
+ y: 1275
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ classes:
+ - id: '1'
+ name: jitter
+ - id: '2'
+ name: continuous
+ desc: ''
+ instruction: Determine whether the input conclusion is jitter or continuous
+ instructions: ''
+ model:
+ completion_params:
+ temperature: 0.7
+ mode: chat
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
+ query_variable_selector:
+ - '1741159085487'
+ - text
+ selected: false
+ title: llm analysis
+ topics: []
+ type: question-classifier
+ vision:
+ enabled: false
+ height: 168
+ id: '1741311244655'
+ position:
+ x: 2462
+ y: 560
+ positionAbsolute:
+ x: 2462
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ code: "\ndef main(arg1: str) -> dict:\n res = \"true\"\n if arg1 ==\
+ \ \"continuous\":\n res = \"false\"\n return {\n \"result\"\
+ : res,\n }\n"
+ code_language: python3
+ desc: ''
+ outputs:
+ result:
+ children: null
+ type: string
+ selected: false
+ title: get result
+ type: code
+ variables:
+ - value_selector:
+ - '1741311244655'
+ - class_name
+ variable: arg1
+ height: 54
+ id: '1741311294320'
+ position:
+ x: 2766
+ y: 560
+ positionAbsolute:
+ x: 2766
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ output_type: string
+ selected: false
+ title: summary
+ type: variable-aggregator
+ variables:
+ - - '1741311294320'
+ - result
+ - - '1742366303110'
+ - class_name
+ height: 130
+ id: '1741311394752'
+ position:
+ x: 3070
+ y: 560
+ positionAbsolute:
+ x: 3070
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Average service response time (milliseconds, by service name and content
+ key, within a specified time period)
+ tool_configurations: {}
+ tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328045214'
+ position:
+ x: 1246
+ y: 617
+ positionAbsolute:
+ x: 1246
+ y: 617
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Container CPU throttling duration (when using Containerd container
+ runtime, statistics by container and Pod)
+ tool_configurations: {}
+ tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328076453'
+ position:
+ x: 1246
+ y: 711
+ positionAbsolute:
+ x: 1246
+ y: 711
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: The network round-trip time between the container and the downstream
+ service (RTT, by namespace and Pod)
+ tool_configurations: {}
+ tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ tool_name: 查询容器网络与下游RTT
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328197695'
+ position:
+ x: 1246
+ y: 899
+ positionAbsolute:
+ x: 1246
+ y: 899
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host disk usage (percentage, excluding rootfs)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328213545'
+ position:
+ x: 1246
+ y: 993
+ positionAbsolute:
+ x: 1246
+ y: 993
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host network receiving rate (bits/second)
+ tool_configurations: {}
+ tool_label: 宿主机网络接收速率(比特/秒)
+ tool_name: 宿主机网络接收速率(比特/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328346220'
+ position:
+ x: 1246
+ y: 1087
+ positionAbsolute:
+ x: 1246
+ y: 1087
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host disk read data rate (bytes/second)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘读取数据速率(字节/秒)
+ tool_name: 宿主机磁盘读取数据速率(字节/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328423453'
+ position:
+ x: 1246
+ y: 1181
+ positionAbsolute:
+ x: 1246
+ y: 1181
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host disk write data rate (bytes/second)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘写入数据速率(字节/秒)
+ tool_name: 宿主机磁盘写入数据速率(字节/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328466394'
+ position:
+ x: 1246
+ y: 1275
+ positionAbsolute:
+ x: 1246
+ y: 1275
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host disk IO time consumption rate
+ tool_configurations: {}
+ tool_label: 宿主机磁盘IO耗时速率
+ tool_name: 宿主机磁盘IO耗时速率
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328742817'
+ position:
+ x: 1246
+ y: 1369
+ positionAbsolute:
+ x: 1246
+ y: 1369
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Host IO waiting CPU busy rate
+ tool_configurations: {}
+ tool_label: 宿主机IO等待CPU繁忙率
+ tool_name: host_cpu_iowait
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328773213'
+ position:
+ x: 1246
+ y: 1463
+ positionAbsolute:
+ x: 1246
+ y: 1463
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: The number of file descriptors currently open on the host
+ tool_configurations: {}
+ tool_label: 宿主机当前打开文件描述符数
+ tool_name: host_cpu_fd_open
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328799030'
+ position:
+ x: 1246
+ y: 1557
+ positionAbsolute:
+ x: 1246
+ y: 1557
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: Service request success rate (by service name and content key, within
+ a specified time period)
+ tool_configurations: {}
+ tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741329632798'
+ position:
+ x: 1246
+ y: 805
+ positionAbsolute:
+ x: 1246
+ y: 805
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ context:
+ enabled: false
+ variable_selector: []
+ desc: ''
+ model:
+ completion_params:
+ temperature: 0.7
+ mode: chat
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
+ prompt_template:
+ - id: c981a70d-9ebb-4f03-949a-8d78826f9bda
+ role: system
+ text: You are an intelligent assistant that helps users solve problems in
+ the field of observability
+ - id: c62c7537-195d-41e7-9127-116cf3debc7c
+ role: user
+ text: '##Purpose
+
+ Please analyze the indicator change trend of the system/application in
+ the past 15 minutes, and analyze it in combination with the current alert
+ event.
+
+ ##Steps
+
+ 1. List the change trend of MetricsData in the past 15 minutes, describe
+ whether the changes of these Metrics are normal, and whether there are
+ abnormal fluctuations or trends.
+
+ 2. Confirmation of alarm validity: Combined with the alarm event, determine
+ whether the current alert is valid.
+
+ If MetricsData continues to rise or is at a high level, the alarm is considered
+ valid.
+
+ If it is in a fluctuating state, that is, it rises occasionally but then
+ falls, the alert is considered invalid.
+
+ If MetricsData eventually returns to the normal range or low value, the
+ alarm is considered invalid.
+
+ If there is historical data, it is necessary to compare and analyze the
+ historical data. If it is higher than the historical data, the alert is
+ also valid.
+
+ ##Output
+
+ Describe the trend of MetricsData and draw a conclusion on whether the
+ alert is valid.
+
+ Note: The conclusion of the alert validity analysis can only be valid
+ or invalid
+
+ ##Data
+
+ MetricsData
+
+ {{#1741162531836.output#}}
+
+ Historical data of metricsdata
+
+ {{#1742434016239.output#}}
+
+ Alert event description
+
+ {{#1741157526222.alert#}}'
selected: false
- title: Agent
- type: agent
- height: 197
- id: '1741159085487'
+ title: llm analysis metrics data
+ type: llm
+ variables: []
+ vision:
+ enabled: false
+ height: 90
+ id: '1742366141890'
+ position:
+ x: 2462
+ y: 1314
+ positionAbsolute:
+ x: 2462
+ y: 1314
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ classes:
+ - id: '1'
+ name: 'true'
+ - id: '2'
+ name: 'false'
+ desc: ''
+ instruction: '# Purpose
+
+ Classify based on the input conclusion
+
+ If the conclusion is that the alert is valid, classify it as false
+
+ If the conclusion is that the alert is invalid, classify it as true
+
+ # Note
+
+ Please check the text carefully and look for conclusions about the effectiveness
+ of the alarm, do not misclassify'
+ instructions: ''
+ model:
+ completion_params:
+ temperature: 0.7
+ mode: chat
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
+ query_variable_selector:
+ - '1742366141890'
+ - text
+ selected: false
+ title: data trend classify
+ topics: []
+ type: question-classifier
+ vision:
+ enabled: false
+ height: 168
+ id: '1742366303110'
position:
- x: 1307.6754497452887
- y: 1290.1574754514506
+ x: 2766
+ y: 1218
positionAbsolute:
- x: 1307.6754497452887
- y: 1290.1574754514506
+ x: 2766
+ y: 1218
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
- code: "\ndef get_value(data, keys):\n for key in keys:\n value =\
- \ data.get(key)\n if value is not None:\n return value\n\
- \ return \"\"\n\nimport json\ndef main(arg: str) -> dict:\n data =\
- \ json.loads(arg)\n return {\n \"node\": data.get('node', ''),\n\
- \ \"service\": get_value(data, [\"svc_name\", \"service\"]),\n \
- \ \"endpoint\": get_value(data,[\"endpoint\", \"content_key\"]),\n\
- \ \"pod\": data.get('pod', ''),\n \"namespace\": data.get('namespace',\
- \ ''),\n }\n"
+ code: "SECOND = 1000000 # microseconds\nMINUTE = 60 * SECOND\nHOUR = 60 *\
+ \ MINUTE\n\ndef main(arg1: int, arg2: int) -> dict:\n \n return {\n\
+ \ \"history_st\": arg1 - (24*HOUR),\n \"history_et\": arg2,\n\
+ \ }\n"
code_language: python3
desc: ''
outputs:
- endpoint:
- children: null
- type: string
- namespace:
- children: null
- type: string
- node:
- children: null
- type: string
- pod:
+ history_et:
children: null
- type: string
- service:
+ type: number
+ history_st:
children: null
- type: string
+ type: number
+ retry_config:
+ max_retries: 3
+ retry_enabled: true
+ retry_interval: 1000
+ selected: false
+ title: get history data range
+ type: code
+ variables:
+ - value_selector:
+ - '1741157526222'
+ - startTime
+ variable: arg1
+ - value_selector:
+ - '1741157526222'
+ - endTime
+ variable: arg2
+ height: 80
+ id: '1742433446760'
+ position:
+ x: 638
+ y: 560
+ positionAbsolute:
+ x: 638
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
selected: false
- title: get params
- type: code
- variables:
- - value_selector:
- - '1741157526222'
- - params
- variable: arg
- height: 53
- id: '1741161440242'
+ title: History Average service response time (milliseconds, by service name
+ and content key, within a specified time period)
+ tool_configurations: {}
+ tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424339242280'
position:
- x: -69.08988532973478
- y: 292.1938971823079
+ x: 1550
+ y: 617
positionAbsolute:
- x: -69.08988532973478
- y: 292.1938971823079
+ x: 1550
+ y: 617
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
output_type: string
selected: false
- title: aggregator data
+ title: summary history data
type: variable-aggregator
variables:
- - - '1741328045214'
+ - - '17424339242280'
- text
- - - '1741328058981'
+ - - '17429797664440'
- text
- - - '1741328076453'
+ - - '17424348570980'
- text
- - - '1741328169934'
+ - - '17424348526540'
- text
- - - '1741329632798'
+ - - '17424348206030'
- text
- - - '1741328197695'
+ - - '17424347242840'
- text
- - - '1741328423453'
+ - - '17424346884650'
- text
- - - '1741328466394'
+ - - '17424342365860'
- text
- - - '1741328692906'
+ - - '17424344697090'
- text
- - - '1741328742817'
+ - - '17424345080000'
- text
- - - '1741328773213'
+ - - '17424345826170'
- text
- - - '1741328799030'
+ - - '17424345315500'
- text
- - - '1741591590829'
+ - - '17429798797920'
- text
- height: 370
- id: '1741162531836'
+ - - '17429835599060'
+ - text
+ - - '17429835940550'
+ - text
+ height: 416
+ id: '1742434016239'
+ position:
+ x: 2158
+ y: 1166
+ positionAbsolute:
+ x: 2158
+ y: 1166
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: history Container CPU throttling duration (when using Containerd container
+ runtime, statistics by container and Pod)
+ tool_configurations: {}
+ tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424342365860'
position:
- x: 1791.1271628500772
- y: 78.61010888432415
+ x: 1550
+ y: 711
positionAbsolute:
- x: 1791.1271628500772
- y: 78.61010888432415
+ x: 1550
+ y: 711
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -1944,171 +3474,143 @@ workflow:
default: null
form: llm
human_description:
- en_US: time series metric data
- ja_JP: time series metric data
- pt_BR: time series metric data
- zh_Hans: 时序指标数据
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
label:
- en_US: metricData
- ja_JP: metricData
- pt_BR: metricData
- zh_Hans: metricData
- llm_description: Time series indicator data
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
max: null
min: null
- name: metricData
+ name: startTime
options: []
placeholder: null
precision: null
required: true
scope: null
template: null
- type: string
+ type: number
- auto_generate: null
default: null
form: llm
human_description:
- en_US: threshold
- ja_JP: threshold
- pt_BR: threshold
- zh_Hans: 趋势分析阈值
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
label:
- en_US: threshold
- ja_JP: threshold
- pt_BR: threshold
- zh_Hans: threshold
- llm_description: threshold
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
max: null
min: null
- name: threshold
+ name: endTime
options: []
placeholder: null
precision: null
- required: false
+ required: true
scope: null
template: null
- type: string
+ type: number
params:
- metricData: ''
- threshold: ''
- provider_id: apo_analysis
- provider_name: apo_analysis
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
provider_type: builtin
selected: false
- title: trend analysis
+ title: history Service request success rate (by service name and content
+ key, within a specified time period)
tool_configurations: {}
- tool_label: 趋势分析
- tool_name: trend
+ tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
tool_parameters:
- metricData:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ service_name:
type: mixed
- value: '{{#1741162531836.output#}}'
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741166377433'
- position:
- x: 2391.9587465022714
- y: 113.39535872618072
- positionAbsolute:
- x: 2391.9587465022714
- y: 113.39535872618072
- selected: false
- sourcePosition: right
- targetPosition: left
- type: custom
- width: 243
- - data:
- classes:
- - id: '1'
- name: jitter
- - id: '2'
- name: continuous
- desc: ''
- instruction: Determine whether the input conclusion is jitter or continuous
- instructions: ''
- model:
- completion_params:
- temperature: 0.7
- mode: chat
- name: deepseek-chat
- provider: langgenius/deepseek/deepseek
- query_variable_selector:
- - '1741159085487'
- - text
- selected: false
- title: Question Classifier
- topics: []
- type: question-classifier
- vision:
- enabled: false
- height: 167
- id: '1741311244655'
- position:
- x: 1978.2523323677738
- y: 1024.2103589724884
- positionAbsolute:
- x: 1978.2523323677738
- y: 1024.2103589724884
- selected: false
- sourcePosition: right
- targetPosition: left
- type: custom
- width: 243
- - data:
- code: "\ndef main(arg1: str) -> dict:\n res = \"true\"\n if arg1 ==\
- \ \"continuous\":\n res = \"false\"\n return {\n \"result\"\
- : res,\n }\n"
- code_language: python3
- desc: ''
- outputs:
- result:
- children: null
- type: string
- selected: false
- title: get alert vaild
- type: code
- variables:
- - value_selector:
- - '1741311244655'
- - class_name
- variable: arg1
- height: 53
- id: '1741311294320'
- position:
- x: 2339.896564438594
- y: 908.8373922229209
- positionAbsolute:
- x: 2339.896564438594
- y: 908.8373922229209
- selected: false
- sourcePosition: right
- targetPosition: left
- type: custom
- width: 243
- - data:
- desc: ''
- output_type: string
- selected: false
- title: aggregator data
- type: variable-aggregator
- variables:
- - - '1741311294320'
- - result
- - - '1741166377433'
- - text
- height: 128
- id: '1741311394752'
+ height: 54
+ id: '17424344697090'
position:
- x: 3165.5195077270564
- y: 457.05597714025964
+ x: 1550
+ y: 805
positionAbsolute:
- x: 3165.5195077270564
- y: 457.05597714025964
+ x: 1550
+ y: 805
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2118,19 +3620,43 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified service name
- ja_JP: Specified service name
- pt_BR: Specified service name
- zh_Hans: 指定的服务名
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
label:
- en_US: service_name
- ja_JP: service_name
- pt_BR: service_name
- zh_Hans: service_name
- llm_description: 指定的服务名
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
max: null
min: null
- name: service_name
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
options: []
placeholder: null
precision: null
@@ -2142,19 +3668,117 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified endpoint name
- ja_JP: Specified endpoint name
- pt_BR: Specified endpoint name
- zh_Hans: 指定的服务端点名
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: history The network round-trip time between the container and the downstream
+ service (RTT, by namespace and Pod)
+ tool_configurations: {}
+ tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ tool_name: 查询容器网络与下游RTT
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424345080000'
+ position:
+ x: 1550
+ y: 899
+ positionAbsolute:
+ x: 1550
+ y: 899
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: content_key
- ja_JP: content_key
- pt_BR: content_key
- zh_Hans: content_key
- llm_description: 指定的服务端点名
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: content_key
+ name: node
options: []
placeholder: null
precision: null
@@ -2211,50 +3835,45 @@ workflow:
template: null
type: number
params:
- content_key: ''
endTime: ''
- service_name: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Average service response time (milliseconds, by service name and content
- key, within a specified time period)
+ title: history Host disk usage (percentage, excluding rootfs)
tool_configurations: {}
- tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
- tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
tool_parameters:
- content_key:
- type: mixed
- value: '{{#1741161440242.endpoint#}}'
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- service_name:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.service#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328045214'
+ height: 54
+ id: '17424345315500'
position:
- x: 855.3123364340672
- y: 87.84552204580373
+ x: 1550
+ y: 993
positionAbsolute:
- x: 855.3123364340672
- y: 87.84552204580373
+ x: 1550
+ y: 993
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2264,43 +3883,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2358,49 +3953,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Container CPU usage (when using Containerd container runtime, statistics
- are calculated by container and Pod)
+ title: history Host network receiving rate (bits/second)
tool_configurations: {}
- tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器CPU利用率
+ tool_label: 宿主机网络接收速率(比特/秒)
+ tool_name: 宿主机网络接收速率(比特/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328058981'
+ height: 54
+ id: '17424345826170'
position:
- x: 866.9205146355775
- y: 182.43066738622156
+ x: 1550
+ y: 1087
positionAbsolute:
- x: 866.9205146355775
- y: 182.43066738622156
+ x: 1550
+ y: 1087
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2410,43 +4000,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2504,49 +4070,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Container CPU throttling duration (when using Containerd container
- runtime, statistics by container and Pod)
+ title: history Host disk read data rate (bytes/second)
tool_configurations: {}
- tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_label: 宿主机磁盘读取数据速率(字节/秒)
+ tool_name: 宿主机磁盘读取数据速率(字节/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328076453'
+ height: 54
+ id: '17424346884650'
position:
- x: 879.4543026140257
- y: 267.35126206280336
+ x: 1550
+ y: 1181
positionAbsolute:
- x: 879.4543026140257
- y: 267.35126206280336
+ x: 1550
+ y: 1181
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2556,43 +4117,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2650,49 +4187,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Number of bytes of container memory used (when using containerd container
- runtime, statistics are calculated by container and Pod)
+ title: history Host disk write data rate (bytes/second)
tool_configurations: {}
- tool_label: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器内存使用量
+ tool_label: 宿主机磁盘写入数据速率(字节/秒)
+ tool_name: 宿主机磁盘写入数据速率(字节/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328169934'
+ height: 54
+ id: '17424347242840'
position:
- x: 879.4543026140257
- y: 347.02153779457154
+ x: 1550
+ y: 1275
positionAbsolute:
- x: 879.4543026140257
- y: 347.02153779457154
+ x: 1550
+ y: 1275
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2702,43 +4234,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
- label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2796,49 +4304,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: The network round-trip time between the container and the downstream
- service (RTT, by namespace and Pod)
+ title: history Host disk IO time consumption rate
tool_configurations: {}
- tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
- tool_name: 查询容器网络与下游RTT
+ tool_label: 宿主机磁盘IO耗时速率
+ tool_name: 宿主机磁盘IO耗时速率
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328197695'
+ height: 54
+ id: '17424348206030'
position:
- x: 879.4543026140257
- y: 516.6534783332379
+ x: 1550
+ y: 1369
positionAbsolute:
- x: 879.4543026140257
- y: 516.6534783332379
+ x: 1550
+ y: 1369
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2924,38 +4427,38 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host disk usage (percentage, excluding rootfs)
+ title: history Host IO waiting CPU busy rate
tool_configurations: {}
- tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
- tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_label: 宿主机IO等待CPU繁忙率
+ tool_name: host_cpu_iowait
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328213545'
+ height: 54
+ id: '17424348526540'
position:
- x: 897.1352138415443
- y: 617.4421900673747
+ x: 1550
+ y: 1463
positionAbsolute:
- x: 897.1352138415443
- y: 617.4421900673747
+ x: 1550
+ y: 1463
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3041,38 +4544,86 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host network receiving rate (bits/second)
+ title: history The number of file descriptors currently open on the host
tool_configurations: {}
- tool_label: 宿主机网络接收速率(比特/秒)
- tool_name: 宿主机网络接收速率(比特/秒)
+ tool_label: 宿主机当前打开文件描述符数
+ tool_name: host_cpu_fd_open
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328346220'
+ height: 54
+ id: '17424348570980'
+ position:
+ x: 1550
+ y: 1557
+ positionAbsolute:
+ x: 1550
+ y: 1557
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ code: " \ndef get_value(data, keys): \n for key in keys: \n value = data.get(key)\
+ \ \n if value is not None: \n return value \n return \"\" \n\n\
+ import json \n\ndef main(arg: str) -> dict:\n data = json.loads(arg) \n\
+ \ return { \n \"node\": get_value(data, [\"svc_node\", \"node\", \"nodename\"\
+ ]), \n \"service\": get_value(data, [\"svc_name\", \"service\"]),\
+ \ \n \"endpoint\": get_value(data,[\"endpoint\", \"content_key\"]), \n\
+ \ \"pod\": get_value(data,[\"pod\", \"src_pod\", \"pod_name\"]), \n \"\
+ namespace\": get_value(data,[\"namespace\", \"src_namespace\"]), \n}"
+ code_language: python3
+ desc: ''
+ outputs:
+ endpoint:
+ children: null
+ type: string
+ namespace:
+ children: null
+ type: string
+ node:
+ children: null
+ type: string
+ pod:
+ children: null
+ type: string
+ service:
+ children: null
+ type: string
+ selected: false
+ title: get alert event labels
+ type: code
+ variables:
+ - value_selector:
+ - '1741157526222'
+ - params
+ variable: arg
+ height: 54
+ id: '1742806924635'
position:
- x: 897.1352138415443
- y: 706.3425334205976
+ x: 334
+ y: 560
positionAbsolute:
- x: 897.1352138415443
- y: 706.3425334205976
+ x: 334
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3082,23 +4633,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3106,16 +4657,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3130,16 +4729,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3151,45 +4750,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host disk read data rate (bytes/second)
+ title: container cpu usage
tool_configurations: {}
- tool_label: 宿主机磁盘读取数据速率(字节/秒)
- tool_name: 宿主机磁盘读取数据速率(字节/秒)
+ tool_label: Container CPU usage rate (Containerd runtime, aggregated by container
+ and Pod)
+ tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328423453'
+ height: 54
+ id: '1742979394268'
position:
- x: 909.6690018199924
- y: 807.5848583297699
+ x: 1246
+ y: 1839
positionAbsolute:
- x: 909.6690018199924
- y: 807.5848583297699
+ x: 1246
+ y: 1839
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3199,23 +4804,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3223,16 +4828,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3247,16 +4900,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3268,45 +4921,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host disk write data rate (bytes/second)
+ title: contaienr rss
tool_configurations: {}
- tool_label: 宿主机磁盘写入数据速率(字节/秒)
- tool_name: 宿主机磁盘写入数据速率(字节/秒)
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328466394'
+ height: 54
+ id: '1742979595004'
position:
- x: 922.0951827508213
- y: 890.0354967992098
+ x: 1246
+ y: 1933
positionAbsolute:
- x: 922.0951827508213
- y: 890.0354967992098
+ x: 1246
+ y: 1933
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3316,23 +4975,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3340,16 +4999,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3364,16 +5071,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3385,45 +5092,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host CPU busy rate (percentage)
+ title: container rss
tool_configurations: {}
- tool_label: 宿主机CPU繁忙率(百分比)
- tool_name: 查询主机CPU利用率
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328692906'
+ height: 54
+ id: '17429797453350'
position:
- x: 1288.1326361010936
- y: 765.9218546549957
+ x: 1246
+ y: 1651
positionAbsolute:
- x: 1288.1326361010936
- y: 765.9218546549957
+ x: 1246
+ y: 1651
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3433,23 +5146,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3457,16 +5170,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3481,16 +5242,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3502,45 +5263,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host disk IO time consumption rate
+ title: history container rss
tool_configurations: {}
- tool_label: 宿主机磁盘IO耗时速率
- tool_name: 宿主机磁盘IO耗时速率
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- node:
+ - '1742433446760'
+ - history_et
+ namespace:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328742817'
+ height: 54
+ id: '17429797664440'
position:
- x: 1320.3050732843196
- y: 838.8279382371494
+ x: 1550
+ y: 1651
positionAbsolute:
- x: 1320.3050732843196
- y: 838.8279382371494
+ x: 1550
+ y: 1651
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3550,23 +5317,47 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: Prometheus job name for host metrics
+ ja_JP: Prometheus job name for host metrics
+ pt_BR: Prometheus job name for host metrics
+ zh_Hans: Prometheus任务名称(宿主机指标)
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: Prometheus Job
+ ja_JP: Prometheus Job
+ pt_BR: Tarefa Prometheus
+ zh_Hans: Prometheus任务
+ llm_description: Unique identifier for metrics scrape job
+ max: null
+ min: null
+ name: job
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Host node identifier
+ ja_JP: Host node identifier
+ pt_BR: Host node identifier
+ zh_Hans: 宿主机节点标识
+ label:
+ en_US: Host Node
+ ja_JP: Host Node
+ pt_BR: Host Node
+ zh_Hans: 宿主机节点
+ llm_description: Unique identifier for host node
max: null
min: null
name: node
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3574,16 +5365,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3598,16 +5389,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3620,16 +5411,17 @@ workflow:
type: number
params:
endTime: ''
+ job: ''
node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Host IO waiting CPU busy rate
+ title: host cpu
tool_configurations: {}
- tool_label: 宿主机IO等待CPU繁忙率
- tool_name: host_cpu_iowait
+ tool_label: Query host's CPU pressure
+ tool_name: 查询宿主机CPU压力
tool_parameters:
endTime:
type: variable
@@ -3638,26 +5430,26 @@ workflow:
- endTime
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328773213'
+ height: 54
+ id: '1742979828391'
position:
- x: 1295.1943032554088
- y: 918.3967184410467
+ x: 1246
+ y: 1745
positionAbsolute:
- x: 1295.1943032554088
- y: 918.3967184410467
+ x: 1246
+ y: 1745
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3667,23 +5459,47 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: Prometheus job name for host metrics
+ ja_JP: Prometheus job name for host metrics
+ pt_BR: Prometheus job name for host metrics
+ zh_Hans: Prometheus任务名称(宿主机指标)
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: Prometheus Job
+ ja_JP: Prometheus Job
+ pt_BR: Tarefa Prometheus
+ zh_Hans: Prometheus任务
+ llm_description: Unique identifier for metrics scrape job
+ max: null
+ min: null
+ name: job
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Host node identifier
+ ja_JP: Host node identifier
+ pt_BR: Host node identifier
+ zh_Hans: 宿主机节点标识
+ label:
+ en_US: Host Node
+ ja_JP: Host Node
+ pt_BR: Host Node
+ zh_Hans: 宿主机节点
+ llm_description: Unique identifier for host node
max: null
min: null
name: node
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3691,16 +5507,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3715,16 +5531,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3737,44 +5553,45 @@ workflow:
type: number
params:
endTime: ''
+ job: ''
node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: The number of file descriptors currently open on the host
+ title: history host cpu
tool_configurations: {}
- tool_label: 宿主机当前打开文件描述符数
- tool_name: host_cpu_fd_open
+ tool_label: Query host's CPU pressure
+ tool_name: 查询宿主机CPU压力
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328799030'
+ height: 54
+ id: '17429798797920'
position:
- x: 1300.5588170319227
- y: 999.2631864254831
+ x: 1550
+ y: 1745
positionAbsolute:
- x: 1300.5588170319227
- y: 999.2631864254831
+ x: 1550
+ y: 1745
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3784,23 +5601,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified service name
- ja_JP: Specified service name
- pt_BR: Specified service name
- zh_Hans: 指定的服务名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: service_name
- ja_JP: service_name
- pt_BR: service_name
- zh_Hans: service_name
- llm_description: 指定的服务名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: service_name
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3808,23 +5625,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified endpoint name
- ja_JP: Specified endpoint name
- pt_BR: Specified endpoint name
- zh_Hans: 指定的服务端点名
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: content_key
- ja_JP: content_key
- pt_BR: content_key
- zh_Hans: content_key
- llm_description: 指定的服务端点名
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
- name: content_key
+ name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3832,16 +5649,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3856,16 +5697,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3877,50 +5718,51 @@ workflow:
template: null
type: number
params:
- content_key: ''
+ cadvisor_job_name: ''
endTime: ''
- service_name: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: Service request success rate (by service name and content key, within
- a specified time period)
+ title: history container cpu usage
tool_configurations: {}
- tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
- tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
+ tool_label: Container CPU usage rate (Containerd runtime, aggregated by container
+ and Pod)
+ tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
- content_key:
- type: mixed
- value: '{{#1741161440242.endpoint#}}'
endTime:
type: variable
value:
- '1741157526222'
- endTime
- service_name:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.service#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741329632798'
+ height: 54
+ id: '17429835599060'
position:
- x: 879.4543026140257
- y: 428.59818368333947
+ x: 1550
+ y: 1839
positionAbsolute:
- x: 879.4543026140257
- y: 428.59818368333947
+ x: 1550
+ y: 1839
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3930,23 +5772,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: pod
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3954,23 +5796,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3978,16 +5820,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -4002,16 +5868,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -4023,6 +5889,7 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
namespace: ''
pod: ''
@@ -4031,11 +5898,11 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: Number of bytes of container memory used (when using containerd container
- runtime, statistics are calculated by container and Pod)
+ title: history container rss
tool_configurations: {}
- tool_label: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器内存使用量
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
@@ -4044,30 +5911,30 @@ workflow:
- endTime
namespace:
type: mixed
- value: '{{#1741161440242.namespace#}}'
+ value: '{{#1742806924635.namespace#}}'
pod:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741591590829'
+ height: 54
+ id: '17429835940550'
position:
- x: 1106.622658811791
- y: 1100.534952103478
+ x: 1550
+ y: 1933
positionAbsolute:
- x: 1106.622658811791
- y: 1100.534952103478
+ x: 1550
+ y: 1933
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
viewport:
- x: 562.6748622348487
- y: 184.9909979491867
- zoom: 0.5641586917716426
+ x: -177.69424554330567
+ y: -151.32564818705146
+ zoom: 0.6449586508173727
diff --git a/api/init_data/workflows/zh/告警有效性确认.yml b/api/init_data/workflows/zh/告警有效性确认.yml
index d96ae3448e..bfe8fe21d9 100644
--- a/api/init_data/workflows/zh/告警有效性确认.yml
+++ b/api/init_data/workflows/zh/告警有效性确认.yml
@@ -60,44 +60,12 @@ workflow:
voice: ''
graph:
edges:
- - data:
- isInIteration: false
- sourceType: code
- targetType: question-classifier
- id: 1741161440242-source-1741158559444-target
- source: '1741161440242'
- sourceHandle: source
- target: '1741158559444'
- targetHandle: target
- type: custom
- zIndex: 0
- - data:
- isInIteration: false
- sourceType: variable-aggregator
- targetType: tool
- id: 1741162531836-source-1741166377433-target
- source: '1741162531836'
- sourceHandle: source
- target: '1741166377433'
- targetHandle: target
- type: custom
- zIndex: 0
- - data:
- isInIteration: false
- sourceType: start
- targetType: code
- id: 1741157526222-source-1741161440242-target
- source: '1741157526222'
- sourceHandle: source
- target: '1741161440242'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: agent
targetType: question-classifier
id: 1741159085487-source-1741311244655-target
+ selected: false
source: '1741159085487'
sourceHandle: source
target: '1741311244655'
@@ -109,6 +77,7 @@ workflow:
sourceType: question-classifier
targetType: code
id: 1741311244655-1-1741311294320-target
+ selected: false
source: '1741311244655'
sourceHandle: '1'
target: '1741311294320'
@@ -120,6 +89,7 @@ workflow:
sourceType: code
targetType: variable-aggregator
id: 1741311294320-source-1741311394752-target
+ selected: false
source: '1741311294320'
sourceHandle: source
target: '1741311394752'
@@ -131,28 +101,19 @@ workflow:
sourceType: variable-aggregator
targetType: end
id: 1741311394752-source-1741157560922-target
+ selected: false
source: '1741311394752'
sourceHandle: source
target: '1741157560922'
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: tool
- targetType: variable-aggregator
- id: 1741166377433-source-1741311394752-target
- source: '1741166377433'
- sourceHandle: source
- target: '1741311394752'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
targetType: agent
id: 1741158559444-1741319394268-1741159085487-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319394268'
target: '1741159085487'
@@ -164,50 +125,31 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1-1741328045214-target
+ selected: false
source: '1741158559444'
sourceHandle: '1'
target: '1741328045214'
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741158765960-1741328058981-target
- source: '1741158559444'
- sourceHandle: '1741158765960'
- target: '1741328058981'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741318878864-1741328076453-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741318878864'
target: '1741328076453'
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741318899444-1741328169934-target
- source: '1741158559444'
- sourceHandle: '1741318899444'
- target: '1741328169934'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319019432-1741328197695-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319019432'
target: '1741328197695'
@@ -219,6 +161,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319060092-1741328213545-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319060092'
target: '1741328213545'
@@ -230,6 +173,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319099071-1741328346220-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319099071'
target: '1741328346220'
@@ -241,6 +185,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319132527-1741328423453-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319132527'
target: '1741328423453'
@@ -252,28 +197,19 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319160027-1741328466394-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319160027'
target: '1741328466394'
targetHandle: target
type: custom
zIndex: 0
- - data:
- isInIteration: false
- sourceType: question-classifier
- targetType: tool
- id: 1741158559444-1741319171199-1741328692906-target
- source: '1741158559444'
- sourceHandle: '1741319171199'
- target: '1741328692906'
- targetHandle: target
- type: custom
- zIndex: 0
- data:
isInIteration: false
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319213624-1741328742817-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319213624'
target: '1741328742817'
@@ -285,6 +221,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319251403-1741328773213-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319251403'
target: '1741328773213'
@@ -296,6 +233,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741319284158-1741328799030-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741319284158'
target: '1741328799030'
@@ -307,6 +245,7 @@ workflow:
sourceType: question-classifier
targetType: tool
id: 1741158559444-1741318983134-1741329632798-target
+ selected: false
source: '1741158559444'
sourceHandle: '1741318983134'
target: '1741329632798'
@@ -315,12 +254,59 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: tool
+ sourceType: llm
+ targetType: question-classifier
+ id: 1742366141890-source-1742366303110-target
+ selected: false
+ source: '1742366141890'
+ sourceHandle: source
+ target: '1742366303110'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: variable-aggregator
+ id: 1742366303110-1-1741311394752-target
+ selected: false
+ source: '1742366303110'
+ sourceHandle: '1'
+ target: '1741311394752'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
targetType: variable-aggregator
- id: 1741328045214-source-1741162531836-target
+ id: 1742366303110-2-1741311394752-target
+ selected: false
+ source: '1742366303110'
+ sourceHandle: '2'
+ target: '1741311394752'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: code
+ targetType: question-classifier
+ id: 1742433446760-source-1741158559444-target
+ source: '1742433446760'
+ sourceHandle: source
+ target: '1741158559444'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328045214-source-17424339242280-target
source: '1741328045214'
sourceHandle: source
- target: '1741162531836'
+ target: '17424339242280'
targetHandle: target
type: custom
zIndex: 0
@@ -328,8 +314,8 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328058981-source-1741162531836-target
- source: '1741328058981'
+ id: 17424339242280-source-1741162531836-target
+ source: '17424339242280'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -337,12 +323,23 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: tool
+ sourceType: variable-aggregator
targetType: variable-aggregator
- id: 1741328076453-source-1741162531836-target
- source: '1741328076453'
+ id: 1741162531836-source-1742434016239-target
+ source: '1741162531836'
sourceHandle: source
- target: '1741162531836'
+ target: '1742434016239'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: variable-aggregator
+ targetType: llm
+ id: 1742434016239-source-1742366141890-target
+ source: '1742434016239'
+ sourceHandle: source
+ target: '1742366141890'
targetHandle: target
type: custom
zIndex: 0
@@ -350,8 +347,8 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328169934-source-1741162531836-target
- source: '1741328169934'
+ id: 17424342365860-source-1741162531836-target
+ source: '17424342365860'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -360,11 +357,22 @@ workflow:
- data:
isInIteration: false
sourceType: tool
- targetType: variable-aggregator
- id: 1741329632798-source-1741162531836-target
+ targetType: tool
+ id: 1741328076453-source-17424342365860-target
+ source: '1741328076453'
+ sourceHandle: source
+ target: '17424342365860'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741329632798-source-17424344697090-target
source: '1741329632798'
sourceHandle: source
- target: '1741162531836'
+ target: '17424344697090'
targetHandle: target
type: custom
zIndex: 0
@@ -372,64 +380,118 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328197695-source-1741162531836-target
- source: '1741328197695'
+ id: 17424344697090-source-1741162531836-target
+ source: '17424344697090'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328197695-source-17424345080000-target
+ source: '1741328197695'
+ sourceHandle: source
+ target: '17424345080000'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328213545-source-1741162531836-target
- source: '1741328213545'
+ id: 17424345080000-source-1741162531836-target
+ source: '17424345080000'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328213545-source-17424345315500-target
+ source: '1741328213545'
+ sourceHandle: source
+ target: '17424345315500'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328346220-source-1741162531836-target
- source: '1741328346220'
+ id: 17424345315500-source-1741162531836-target
+ source: '17424345315500'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328346220-source-17424345826170-target
+ source: '1741328346220'
+ sourceHandle: source
+ target: '17424345826170'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328423453-source-1741162531836-target
- source: '1741328423453'
+ id: 17424345826170-source-1741162531836-target
+ source: '17424345826170'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328423453-source-17424346884650-target
+ source: '1741328423453'
+ sourceHandle: source
+ target: '17424346884650'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328466394-source-1741162531836-target
- source: '1741328466394'
+ id: 17424346884650-source-1741162531836-target
+ source: '17424346884650'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328466394-source-17424347242840-target
+ source: '1741328466394'
+ sourceHandle: source
+ target: '17424347242840'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328692906-source-1741162531836-target
- selected: false
- source: '1741328692906'
+ id: 17424347242840-source-1741162531836-target
+ source: '17424347242840'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -438,11 +500,11 @@ workflow:
- data:
isInIteration: false
sourceType: tool
- targetType: variable-aggregator
- id: 1741328742817-source-1741162531836-target
+ targetType: tool
+ id: 1741328742817-source-17424348206030-target
source: '1741328742817'
sourceHandle: source
- target: '1741162531836'
+ target: '17424348206030'
targetHandle: target
type: custom
zIndex: 0
@@ -450,19 +512,30 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328773213-source-1741162531836-target
- source: '1741328773213'
+ id: 17424348206030-source-1741162531836-target
+ source: '17424348206030'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1741328773213-source-17424348526540-target
+ source: '1741328773213'
+ sourceHandle: source
+ target: '17424348526540'
+ targetHandle: target
+ type: custom
+ zIndex: 0
- data:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741328799030-source-1741162531836-target
- source: '1741328799030'
+ id: 17424348526540-source-1741162531836-target
+ source: '17424348526540'
sourceHandle: source
target: '1741162531836'
targetHandle: target
@@ -470,12 +543,12 @@ workflow:
zIndex: 0
- data:
isInIteration: false
- sourceType: question-classifier
+ sourceType: tool
targetType: tool
- id: 1741158559444-1741591414269-1741591590829-target
- source: '1741158559444'
- sourceHandle: '1741591414269'
- target: '1741591590829'
+ id: 1741328799030-source-17424348570980-target
+ source: '1741328799030'
+ sourceHandle: source
+ target: '17424348570980'
targetHandle: target
type: custom
zIndex: 0
@@ -483,76 +556,230 @@ workflow:
isInIteration: false
sourceType: tool
targetType: variable-aggregator
- id: 1741591590829-source-1741162531836-target
- source: '1741591590829'
+ id: 17424348570980-source-1741162531836-target
+ source: '17424348570980'
sourceHandle: source
target: '1741162531836'
targetHandle: target
type: custom
zIndex: 0
- nodes:
- data:
- desc: ''
- selected: true
- title: 开始
- type: start
- variables:
- - allowed_file_extensions: []
- allowed_file_types:
- - document
- allowed_file_upload_methods:
- - local_file
- - remote_url
- label: alert
- max_length: 256
- options: []
- required: true
- type: text-input
- variable: alert
- - label: params
- max_length: 99999999999
- options: []
- required: true
- type: paragraph
- variable: params
- - label: startTime(微秒)
- max_length: 48
- options: []
- required: true
- type: number
- variable: startTime
- - label: endTime(微秒)
- max_length: 48
- options: []
- required: true
- type: number
- variable: endTime
- - allowed_file_extensions:
- - .json
- allowed_file_types:
- - custom
- allowed_file_upload_methods:
- - local_file
- - remote_url
- label: input
- max_length: 48
- options: []
+ isInIteration: false
+ sourceType: start
+ targetType: code
+ id: 1741157526222-source-1742806924635-target
+ source: '1741157526222'
+ sourceHandle: source
+ target: '1742806924635'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: code
+ targetType: code
+ id: 1742806924635-source-1742433446760-target
+ source: '1742806924635'
+ sourceHandle: source
+ target: '1742433446760'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741158765960-1742979394268-target
+ source: '1741158559444'
+ sourceHandle: '1741158765960'
+ target: '1742979394268'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741318899444-1742979595004-target
+ source: '1741158559444'
+ sourceHandle: '1741318899444'
+ target: '1742979595004'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741591414269-17429797453350-target
+ source: '1741158559444'
+ sourceHandle: '1741591414269'
+ target: '17429797453350'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 17429797453350-source-17429797664440-target
+ source: '17429797453350'
+ sourceHandle: source
+ target: '17429797664440'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429797664440-source-1741162531836-target
+ source: '17429797664440'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: question-classifier
+ targetType: tool
+ id: 1741158559444-1741319171199-1742979828391-target
+ source: '1741158559444'
+ sourceHandle: '1741319171199'
+ target: '1742979828391'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979828391-source-17429798797920-target
+ source: '1742979828391'
+ sourceHandle: source
+ target: '17429798797920'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429798797920-source-1741162531836-target
+ source: '17429798797920'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979394268-source-17429835599060-target
+ source: '1742979394268'
+ sourceHandle: source
+ target: '17429835599060'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429835599060-source-1741162531836-target
+ source: '17429835599060'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: tool
+ id: 1742979595004-source-17429835940550-target
+ source: '1742979595004'
+ sourceHandle: source
+ target: '17429835940550'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ - data:
+ isInIteration: false
+ sourceType: tool
+ targetType: variable-aggregator
+ id: 17429835940550-source-1741162531836-target
+ source: '17429835940550'
+ sourceHandle: source
+ target: '1741162531836'
+ targetHandle: target
+ type: custom
+ zIndex: 0
+ nodes:
+ - data:
+ desc: ''
+ selected: false
+ title: 开始
+ type: start
+ variables:
+ - allowed_file_extensions: []
+ allowed_file_types:
+ - document
+ allowed_file_upload_methods:
+ - local_file
+ - remote_url
+ label: alert
+ max_length: 256
+ options: []
+ required: true
+ type: text-input
+ variable: alert
+ - label: params
+ max_length: 99999999999
+ options: []
+ required: true
+ type: paragraph
+ variable: params
+ - label: startTime
+ max_length: 48
+ options: []
+ required: true
+ type: number
+ variable: startTime
+ - label: endTime
+ max_length: 48
+ options: []
+ required: true
+ type: number
+ variable: endTime
+ - allowed_file_extensions:
+ - .json
+ allowed_file_types:
+ - custom
+ allowed_file_upload_methods:
+ - local_file
+ - remote_url
+ label: input
+ max_length: 48
+ options: []
required: false
type: file
variable: input
- height: 193
+ height: 194
id: '1741157526222'
position:
- x: -474.8546859399444
- y: 113.39535872618072
+ x: -108.57929564245899
+ y: 544.6023004841712
positionAbsolute:
- x: -474.8546859399444
- y: 113.39535872618072
- selected: true
+ x: -108.57929564245899
+ y: 544.6023004841712
+ selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
outputs:
@@ -563,19 +790,19 @@ workflow:
selected: false
title: 结束
type: end
- height: 89
+ height: 90
id: '1741157560922'
position:
- x: 3744.206346600103
- y: 363.73374031791394
+ x: 3374
+ y: 560
positionAbsolute:
- x: 3744.206346600103
- y: 363.73374031791394
+ x: 3374
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
classes:
- id: '1'
@@ -598,11 +825,15 @@ workflow:
- id: '1741318983134'
name: '应用指标
- 错误率上升'
+ 错误率相关
+
+ 如Request error rate exceeds 0%,日志错误数相关'
- id: '1741319019432'
name: '网络相关
- 网络RTT延时超过50ms'
+ 如网络RTT延时超过50ms
+
+ network rtt'
- id: '1741319060092'
name: '主机相关
@@ -642,7 +873,9 @@ workflow:
容器被kill'
desc: ''
- instruction: 请你从告警事件描述来区分告警事件的类型
+ instruction: '请你从告警事件描述
+
+ 来对分告警事件进行分类'
instructions: ''
model:
completion_params:
@@ -654,24 +887,24 @@ workflow:
- '1741157526222'
- alert
selected: false
- title: 问题分类器
+ title: 告警事件分类
topics: []
type: question-classifier
vision:
enabled: false
- height: 687
+ height: 720
id: '1741158559444'
position:
- x: 458.26517283507326
- y: 139.09402013442167
+ x: 197.77785673494304
+ y: 703.2841482722955
positionAbsolute:
- x: 458.26517283507326
- y: 139.09402013442167
- selected: false
+ x: 197.77785673494304
+ y: 703.2841482722955
+ selected: true
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
agent_parameters:
instruction:
@@ -715,10 +948,7 @@ workflow:
endTime:
auto: 1
value: null
- namespace:
- auto: 1
- value: null
- pod:
+ node:
auto: 1
value: null
startTime:
@@ -730,43 +960,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -823,8 +1029,8 @@ workflow:
template: null
type: number
settings: {}
- tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器CPU利用率
+ tool_label: 宿主机IO等待CPU繁忙率
+ tool_name: host_cpu_iowait
type: builtin
- enabled: true
extra:
@@ -833,6 +1039,9 @@ workflow:
endTime:
auto: 1
value: null
+ job:
+ auto: 1
+ value: null
node:
auto: 1
value: null
@@ -845,16 +1054,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: Prometheus job name for host metrics
+ ja_JP: Prometheus job name for host metrics
+ pt_BR: Prometheus job name for host metrics
+ zh_Hans: Prometheus任务名称(宿主机指标)
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: Prometheus Job
+ ja_JP: Prometheus Job
+ pt_BR: Tarefa Prometheus
+ zh_Hans: Prometheus任务
+ llm_description: Unique identifier for metrics scrape job
+ max: null
+ min: null
+ name: job
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Host node identifier
+ ja_JP: Host node identifier
+ pt_BR: Host node identifier
+ zh_Hans: 宿主机节点标识
+ label:
+ en_US: Host Node
+ ja_JP: Host Node
+ pt_BR: Host Node
+ zh_Hans: 宿主机节点
+ llm_description: Unique identifier for host node
max: null
min: null
name: node
@@ -914,126 +1147,8 @@ workflow:
template: null
type: number
settings: {}
- tool_label: 宿主机IO等待CPU繁忙率
- tool_name: host_cpu_iowait
- type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- job:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Prometheus job name for host metrics
- ja_JP: Prometheus job name for host metrics
- pt_BR: Prometheus job name for host metrics
- zh_Hans: Prometheus任务名称(宿主机指标)
- label:
- en_US: Prometheus Job
- ja_JP: Prometheus Job
- pt_BR: Tarefa Prometheus
- zh_Hans: Prometheus任务
- llm_description: Unique identifier for metrics scrape job
- max: null
- min: null
- name: job
- options: []
- placeholder: null
- precision: null
- required: false
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Host node identifier
- ja_JP: Host node identifier
- pt_BR: Host node identifier
- zh_Hans: 宿主机节点标识
- label:
- en_US: Host Node
- ja_JP: Host Node
- pt_BR: Host Node
- zh_Hans: 宿主机节点
- llm_description: Unique identifier for host node
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 查询宿主机最近1分钟的系统负载
- tool_name: 查询宿主机最近1分钟的系统负载
+ tool_label: 查询宿主机最近1分钟的系统负载
+ tool_name: 查询宿主机最近1分钟的系统负载
type: builtin
- enabled: true
extra:
@@ -1480,97 +1595,6 @@ workflow:
tool_label: 查询宿主机根文件系统使用率
tool_name: 查询宿主机根文件系统使用率
type: builtin
- - enabled: true
- extra:
- description: ''
- parameters:
- endTime:
- auto: 1
- value: null
- node:
- auto: 1
- value: null
- startTime:
- auto: 1
- value: null
- provider_name: apo_select
- schemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
- label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
- max: null
- min: null
- name: node
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
- zh_Hans: 开始时间 (微秒)
- label:
- en_US: startTime
- ja_JP: startTime
- pt_BR: startTime
- zh_Hans: startTime
- llm_description: Data query start time
- max: null
- min: null
- name: startTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
- zh_Hans: 结束时间 (微秒)
- label:
- en_US: endTime
- ja_JP: endTime
- pt_BR: endTime
- zh_Hans: endTime
- llm_description: Data query start time
- max: null
- min: null
- name: endTime
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: number
- settings: {}
- tool_label: 宿主机CPU繁忙率(百分比)
- tool_name: 查询主机CPU利用率
- type: builtin
- enabled: true
extra:
description: ''
@@ -1789,81 +1813,33 @@ workflow:
selected: false
title: Agent
type: agent
- height: 197
+ height: 198
id: '1741159085487'
position:
- x: 1307.6754497452887
- y: 1290.1574754514506
- positionAbsolute:
- x: 1307.6754497452887
- y: 1290.1574754514506
- selected: false
- sourcePosition: right
- targetPosition: left
- type: custom
- width: 243
- - data:
- code: "\ndef get_value(data, keys):\n for key in keys:\n value =\
- \ data.get(key)\n if value is not None:\n return value\n\
- \ return \"\"\n\nimport json\ndef main(arg: str) -> dict:\n data =\
- \ json.loads(arg)\n return {\n \"node\": data.get('node', ''),\n\
- \ \"service\": get_value(data, [\"svc_name\", \"service\"]),\n \
- \ \"endpoint\": get_value(data,[\"endpoint\", \"content_key\"]),\n\
- \ \"pod\": data.get('pod', ''),\n \"namespace\": data.get('namespace',\
- \ ''),\n }\n"
- code_language: python3
- desc: ''
- outputs:
- endpoint:
- children: null
- type: string
- namespace:
- children: null
- type: string
- node:
- children: null
- type: string
- pod:
- children: null
- type: string
- service:
- children: null
- type: string
- selected: false
- title: 代码执行
- type: code
- variables:
- - value_selector:
- - '1741157526222'
- - params
- variable: arg
- height: 53
- id: '1741161440242'
- position:
- x: -69.08988532973478
- y: 292.1938971823079
+ x: 2158
+ y: 560
positionAbsolute:
- x: -69.08988532973478
- y: 292.1938971823079
+ x: 2158
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
output_type: string
selected: false
- title: 变量聚合器 2
+ title: 变量聚合提供给大模型分析
type: variable-aggregator
variables:
- - '1741328045214'
- text
- - - '1741328058981'
+ - - '1742979394268'
- text
- - '1741328076453'
- text
- - - '1741328169934'
+ - - '1742979595004'
- text
- - '1741329632798'
- text
@@ -1873,7 +1849,7 @@ workflow:
- text
- - '1741328466394'
- text
- - - '1741328692906'
+ - - '1742979828391'
- text
- - '1741328742817'
- text
@@ -1881,109 +1857,31 @@ workflow:
- text
- - '1741328799030'
- text
- - - '1741591590829'
+ - - '17429797453350'
+ - text
+ - - '1741328346220'
+ - text
+ - - '1741328213545'
- text
- height: 370
+ height: 416
id: '1741162531836'
position:
- x: 1791.1271628500772
- y: 78.61010888432415
+ x: 1854
+ y: 1275
positionAbsolute:
- x: 1791.1271628500772
- y: 78.61010888432415
+ x: 1854
+ y: 1275
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
- desc: ''
- is_team_authorization: true
- output_schema: null
- paramSchemas:
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: time series metric data
- ja_JP: time series metric data
- pt_BR: time series metric data
- zh_Hans: 时序指标数据
- label:
- en_US: metricData
- ja_JP: metricData
- pt_BR: metricData
- zh_Hans: metricData
- llm_description: Time series indicator data
- max: null
- min: null
- name: metricData
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: threshold
- ja_JP: threshold
- pt_BR: threshold
- zh_Hans: 趋势分析阈值
- label:
- en_US: threshold
- ja_JP: threshold
- pt_BR: threshold
- zh_Hans: threshold
- llm_description: threshold
- max: null
- min: null
- name: threshold
- options: []
- placeholder: null
- precision: null
- required: false
- scope: null
- template: null
- type: string
- params:
- metricData: ''
- threshold: ''
- provider_id: apo_analysis
- provider_name: apo_analysis
- provider_type: builtin
- selected: false
- title: 趋势分析
- tool_configurations: {}
- tool_label: 趋势分析
- tool_name: trend
- tool_parameters:
- metricData:
- type: mixed
- value: '{{#1741162531836.output#}}'
- type: tool
- height: 53
- id: '1741166377433'
- position:
- x: 2391.9587465022714
- y: 113.39535872618072
- positionAbsolute:
- x: 2391.9587465022714
- y: 113.39535872618072
- selected: false
- sourcePosition: right
- targetPosition: left
- type: custom
- width: 243
- - data:
- classes:
- - id: '1'
- name: 抖动
- - id: '2'
- name: 持续
+ classes:
+ - id: '1'
+ name: 抖动
+ - id: '2'
+ name: 持续
desc: ''
instruction: 判断输入的结论是抖动还是持续
instructions: ''
@@ -2002,19 +1900,19 @@ workflow:
type: question-classifier
vision:
enabled: false
- height: 167
+ height: 168
id: '1741311244655'
position:
- x: 1978.2523323677738
- y: 1024.2103589724884
+ x: 2462
+ y: 560
positionAbsolute:
- x: 1978.2523323677738
- y: 1024.2103589724884
+ x: 2462
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
code: "\ndef main(arg1: str) -> dict:\n res = \"true\"\n if arg1 ==\
\ \"持续\":\n res = \"false\"\n return {\n \"result\": res,\n\
@@ -2033,19 +1931,19 @@ workflow:
- '1741311244655'
- class_name
variable: arg1
- height: 53
+ height: 54
id: '1741311294320'
position:
- x: 2339.896564438594
- y: 908.8373922229209
+ x: 2766
+ y: 560
positionAbsolute:
- x: 2339.896564438594
- y: 908.8373922229209
+ x: 2766
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
output_type: string
@@ -2055,21 +1953,21 @@ workflow:
variables:
- - '1741311294320'
- result
- - - '1741166377433'
- - text
- height: 128
+ - - '1742366303110'
+ - class_name
+ height: 130
id: '1741311394752'
position:
- x: 3165.5195077270564
- y: 457.05597714025964
+ x: 3070
+ y: 560
positionAbsolute:
- x: 3165.5195077270564
- y: 457.05597714025964
+ x: 3070
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2103,19 +2001,2187 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified endpoint name
- ja_JP: Specified endpoint name
- pt_BR: Specified endpoint name
- zh_Hans: 指定的服务端点名
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_configurations: {}
+ tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328045214'
+ position:
+ x: 1246
+ y: 617
+ positionAbsolute:
+ x: 1246
+ y: 617
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_configurations: {}
+ tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328076453'
+ position:
+ x: 1246
+ y: 711
+ positionAbsolute:
+ x: 1246
+ y: 711
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ tool_configurations: {}
+ tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ tool_name: 查询容器网络与下游RTT
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328197695'
+ position:
+ x: 1246
+ y: 899
+ positionAbsolute:
+ x: 1246
+ y: 899
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328213545'
+ position:
+ x: 1246
+ y: 993
+ positionAbsolute:
+ x: 1246
+ y: 993
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机网络接收速率(比特/秒)
+ tool_configurations: {}
+ tool_label: 宿主机网络接收速率(比特/秒)
+ tool_name: 宿主机网络接收速率(比特/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328346220'
+ position:
+ x: 1246
+ y: 1087
+ positionAbsolute:
+ x: 1246
+ y: 1087
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机磁盘读取数据速率(字节/秒)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘读取数据速率(字节/秒)
+ tool_name: 宿主机磁盘读取数据速率(字节/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328423453'
+ position:
+ x: 1246
+ y: 1181
+ positionAbsolute:
+ x: 1246
+ y: 1181
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机磁盘写入数据速率(字节/秒)
+ tool_configurations: {}
+ tool_label: 宿主机磁盘写入数据速率(字节/秒)
+ tool_name: 宿主机磁盘写入数据速率(字节/秒)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328466394'
+ position:
+ x: 1246
+ y: 1275
+ positionAbsolute:
+ x: 1246
+ y: 1275
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机磁盘IO耗时速率
+ tool_configurations: {}
+ tool_label: 宿主机磁盘IO耗时速率
+ tool_name: 宿主机磁盘IO耗时速率
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328742817'
+ position:
+ x: 1246
+ y: 1369
+ positionAbsolute:
+ x: 1246
+ y: 1369
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机IO等待CPU繁忙率
+ tool_configurations: {}
+ tool_label: 宿主机IO等待CPU繁忙率
+ tool_name: host_cpu_iowait
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328773213'
+ position:
+ x: 1246
+ y: 1463
+ positionAbsolute:
+ x: 1246
+ y: 1463
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
+ label:
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
+ max: null
+ min: null
+ name: node
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ node: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 宿主机当前打开文件描述符数
+ tool_configurations: {}
+ tool_label: 宿主机当前打开文件描述符数
+ tool_name: host_cpu_fd_open
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ node:
+ type: mixed
+ value: '{{#1742806924635.node#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741328799030'
+ position:
+ x: 1246
+ y: 1557
+ positionAbsolute:
+ x: 1246
+ y: 1557
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ tool_configurations: {}
+ tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - endTime
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1741157526222'
+ - startTime
+ type: tool
+ height: 54
+ id: '1741329632798'
+ position:
+ x: 1246
+ y: 805
+ positionAbsolute:
+ x: 1246
+ y: 805
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ context:
+ enabled: false
+ variable_selector: []
+ desc: ''
+ model:
+ completion_params:
+ temperature: 0.7
+ mode: chat
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
+ prompt_template:
+ - id: c981a70d-9ebb-4f03-949a-8d78826f9bda
+ role: system
+ text: 你是一个智能助手,帮助用户解决可观测性领域的问题
+ - id: c62c7537-195d-41e7-9127-116cf3debc7c
+ role: user
+ text: '##目的
+
+ 请分析系统/应用在过去15分钟内的指标变化趋势,并结合当前的告警事件进行分析。
+
+ ##步骤
+
+ 1. 列出过去15分钟内MetricsData的变化趋势,描述这些Metrics的变化是否正常,是否有异常的波动或趋势。
+
+ 2. 告警有效性确认:结合告警事件,判断当前告警是否有效。
+
+ 如果MetricsData持续上升或处于高位,则认为告警有效。
+
+ 如果处于波动状态,即偶尔上升,但随后下降,则认为告警无效。
+
+ 如果最终MetricsData回到正常范围或低位值,则认为告警无效。
+
+ 如果有历史数据,则需要对比分析历史数据,如果相比历史数据升高,告警也为有效
+
+ ##输出
+
+ 描述MetricsData趋势,并得出告警是否有效的结论。
+
+ 注意:告警有效性分析的结论只能是有效或无效
+
+ ##Data
+
+ MetricsData
+
+ {{#1741162531836.output#}}
+
+ metricsdata的历史数据
+
+ {{#1742434016239.output#}}
+
+ 警报事件描述
+
+ {{#1741157526222.alert#}}'
+ selected: false
+ title: 大模型分析指标数据
+ type: llm
+ variables: []
+ vision:
+ enabled: false
+ height: 90
+ id: '1742366141890'
+ position:
+ x: 2462
+ y: 1314
+ positionAbsolute:
+ x: 2462
+ y: 1314
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ classes:
+ - id: '1'
+ name: 'true'
+ - id: '2'
+ name: 'false'
+ desc: ''
+ instruction: '# 目的
+
+ 根据输入的结论进行分类
+
+ 如果结论中认为告警有效,分类到false
+
+ 如果结论中认为告警无效,分类到true
+
+ # 注意
+
+ 请仔细检查文本,并寻找关于告警有效性的结论,不要错误分类'
+ instructions: ''
+ model:
+ completion_params:
+ temperature: 0.7
+ mode: chat
+ name: deepseek-chat
+ provider: langgenius/deepseek/deepseek
+ query_variable_selector:
+ - '1742366141890'
+ - text
+ selected: false
+ title: 结果分类
+ topics: []
+ type: question-classifier
+ vision:
+ enabled: false
+ height: 168
+ id: '1742366303110'
+ position:
+ x: 2766
+ y: 1218
+ positionAbsolute:
+ x: 2766
+ y: 1218
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ code: "SECOND = 1000000 # microseconds\nMINUTE = 60 * SECOND\nHOUR = 60 *\
+ \ MINUTE\n\ndef main(arg1: int, arg2: int) -> dict:\n \n return {\n\
+ \ \"history_st\": arg1 - (24*HOUR),\n \"history_et\": arg2,\n\
+ \ }\n"
+ code_language: python3
+ desc: ''
+ outputs:
+ history_et:
+ children: null
+ type: number
+ history_st:
+ children: null
+ type: number
+ retry_config:
+ max_retries: 3
+ retry_enabled: true
+ retry_interval: 1000
+ selected: false
+ title: 选择历史数据查询区间
+ type: code
+ variables:
+ - value_selector:
+ - '1741157526222'
+ - startTime
+ variable: arg1
+ - value_selector:
+ - '1741157526222'
+ - endTime
+ variable: arg2
+ height: 80
+ id: '1742433446760'
+ position:
+ x: 638
+ y: 560
+ positionAbsolute:
+ x: 638
+ y: 560
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 历史数据 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_configurations: {}
+ tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424339242280'
+ position:
+ x: 1550
+ y: 617
+ positionAbsolute:
+ x: 1550
+ y: 617
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ output_type: string
+ selected: false
+ title: 聚合历史指标数据
+ type: variable-aggregator
+ variables:
+ - - '17424339242280'
+ - text
+ - - '17429797664440'
+ - text
+ - - '17424348570980'
+ - text
+ - - '17424348526540'
+ - text
+ - - '17424348206030'
+ - text
+ - - '17424347242840'
+ - text
+ - - '17424346884650'
+ - text
+ - - '17424342365860'
+ - text
+ - - '17424344697090'
+ - text
+ - - '17424345080000'
+ - text
+ - - '17424345826170'
+ - text
+ - - '17424345315500'
+ - text
+ - - '17429798797920'
+ - text
+ - - '17429835599060'
+ - text
+ - - '17429835940550'
+ - text
+ height: 416
+ id: '1742434016239'
+ position:
+ x: 2145.168583736809
+ y: 1031.2701292364982
+ positionAbsolute:
+ x: 2145.168583736809
+ y: 1031.2701292364982
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: 历史数据 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_configurations: {}
+ tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424342365860'
+ position:
+ x: 1550
+ y: 711
+ positionAbsolute:
+ x: 1550
+ y: 711
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified service name
+ ja_JP: Specified service name
+ pt_BR: Specified service name
+ zh_Hans: 指定的服务名
+ label:
+ en_US: service_name
+ ja_JP: service_name
+ pt_BR: service_name
+ zh_Hans: service_name
+ llm_description: 指定的服务名
+ max: null
+ min: null
+ name: service_name
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified endpoint name
+ ja_JP: Specified endpoint name
+ pt_BR: Specified endpoint name
+ zh_Hans: 指定的服务端点名
+ label:
+ en_US: content_key
+ ja_JP: content_key
+ pt_BR: content_key
+ zh_Hans: content_key
+ llm_description: 指定的服务端点名
+ max: null
+ min: null
+ name: content_key
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ content_key: ''
+ endTime: ''
+ service_name: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: '历史数据 服务请求成功率(按服务名和内容键统计,指定时间段内) '
+ tool_configurations: {}
+ tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
+ tool_parameters:
+ content_key:
+ type: mixed
+ value: '{{#1742806924635.endpoint#}}'
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ service_name:
+ type: mixed
+ value: '{{#1742806924635.service#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424344697090'
+ position:
+ x: 1550
+ y: 805
+ positionAbsolute:
+ x: 1550
+ y: 805
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified pod name
+ ja_JP: Specified pod name
+ pt_BR: Specified pod name
+ zh_Hans: 指定的容器POD名称
+ label:
+ en_US: pod
+ ja_JP: pod
+ pt_BR: pod
+ zh_Hans: pod
+ llm_description: Specified pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified namespace
+ ja_JP: Specified namespace
+ pt_BR: Specified namespace
+ zh_Hans: 指定的容器所在Namespace
+ label:
+ en_US: namespace
+ ja_JP: namespace
+ pt_BR: namespace
+ zh_Hans: namespace
+ llm_description: Specified namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time
+ ja_JP: Data query start time
+ pt_BR: Data query start time
+ zh_Hans: 开始时间 (微秒)
+ label:
+ en_US: startTime
+ ja_JP: startTime
+ pt_BR: startTime
+ zh_Hans: startTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: startTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query end time
+ ja_JP: Data query end time
+ pt_BR: Data query end time
+ zh_Hans: 结束时间 (微秒)
+ label:
+ en_US: endTime
+ ja_JP: endTime
+ pt_BR: endTime
+ zh_Hans: endTime
+ llm_description: Data query start time
+ max: null
+ min: null
+ name: endTime
+ options: []
+ placeholder: null
+ precision: null
+ required: true
+ scope: null
+ template: null
+ type: number
+ params:
+ endTime: ''
+ namespace: ''
+ pod: ''
+ startTime: ''
+ provider_id: apo_select
+ provider_name: apo_select
+ provider_type: builtin
+ selected: false
+ title: '历史数据 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计) '
+ tool_configurations: {}
+ tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ tool_name: 查询容器网络与下游RTT
+ tool_parameters:
+ endTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_et
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
+ startTime:
+ type: variable
+ value:
+ - '1742433446760'
+ - history_st
+ type: tool
+ height: 54
+ id: '17424345080000'
+ position:
+ x: 1550
+ y: 899
+ positionAbsolute:
+ x: 1550
+ y: 899
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ desc: ''
+ is_team_authorization: true
+ output_schema: null
+ paramSchemas:
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: content_key
- ja_JP: content_key
- pt_BR: content_key
- zh_Hans: content_key
- llm_description: 指定的服务端点名
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: content_key
+ name: node
options: []
placeholder: null
precision: null
@@ -2172,49 +4238,45 @@ workflow:
template: null
type: number
params:
- content_key: ''
endTime: ''
- service_name: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
+ title: 历史数据 宿主机磁盘使用率(百分比,不含rootfs)
tool_configurations: {}
- tool_label: 服务平均响应时间(毫秒,按服务名和内容键统计,指定时间段内)
- tool_name: Originx 北极星指标 (服务层级) - RED指标 - 平均响应时间
+ tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
tool_parameters:
- content_key:
- type: mixed
- value: '{{#1741161440242.endpoint#}}'
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- service_name:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.service#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328045214'
+ height: 54
+ id: '17424345315500'
position:
- x: 855.3123364340672
- y: 87.84552204580373
+ x: 1550
+ y: 993
positionAbsolute:
- x: 855.3123364340672
- y: 87.84552204580373
+ x: 1550
+ y: 993
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2224,43 +4286,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2318,48 +4356,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
+ title: 历史数据 宿主机网络接收速率(比特/秒)
tool_configurations: {}
- tool_label: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器CPU利用率
+ tool_label: 宿主机网络接收速率(比特/秒)
+ tool_name: 宿主机网络接收速率(比特/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328058981'
+ height: 54
+ id: '17424345826170'
position:
- x: 866.9205146355775
- y: 182.43066738622156
+ x: 1550
+ y: 1087
positionAbsolute:
- x: 866.9205146355775
- y: 182.43066738622156
+ x: 1550
+ y: 1087
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2369,43 +4403,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2463,48 +4473,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ title: 历史数据 宿主机磁盘读取数据速率(字节/秒)
tool_configurations: {}
- tool_label: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 容器CPU节流时长(使用Containerd容器运行时,按容器和Pod统计)
+ tool_label: 宿主机磁盘读取数据速率(字节/秒)
+ tool_name: 宿主机磁盘读取数据速率(字节/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328076453'
+ height: 54
+ id: '17424346884650'
position:
- x: 879.4543026140257
- y: 267.35126206280336
+ x: 1550
+ y: 1181
positionAbsolute:
- x: 879.4543026140257
- y: 267.35126206280336
+ x: 1550
+ y: 1181
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2514,43 +4520,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2608,48 +4590,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
+ title: '历史数据 宿主机磁盘写入数据速率(字节/秒) '
tool_configurations: {}
- tool_label: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器内存使用量
+ tool_label: 宿主机磁盘写入数据速率(字节/秒)
+ tool_name: 宿主机磁盘写入数据速率(字节/秒)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328169934'
+ height: 54
+ id: '17424347242840'
position:
- x: 879.4543026140257
- y: 347.02153779457154
+ x: 1550
+ y: 1275
positionAbsolute:
- x: 879.4543026140257
- y: 347.02153779457154
+ x: 1550
+ y: 1275
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2659,43 +4637,19 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
- label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
- max: null
- min: null
- name: pod
- options: []
- placeholder: null
- precision: null
- required: true
- scope: null
- template: null
- type: string
- - auto_generate: null
- default: null
- form: llm
- human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Specified host name
+ ja_JP: Specified host name
+ pt_BR: Specified host name
+ zh_Hans: 指定的主机名
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: node
+ ja_JP: node
+ pt_BR: node
+ zh_Hans: node
+ llm_description: Specified host name
max: null
min: null
- name: namespace
+ name: node
options: []
placeholder: null
precision: null
@@ -2753,48 +4707,44 @@ workflow:
type: number
params:
endTime: ''
- namespace: ''
- pod: ''
+ node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
+ title: 历史数据 宿主机磁盘IO耗时速率
tool_configurations: {}
- tool_label: 容器与下游服务的网络往返时间(RTT,按命名空间和Pod统计)
- tool_name: 查询容器网络与下游RTT
+ tool_label: 宿主机磁盘IO耗时速率
+ tool_name: 宿主机磁盘IO耗时速率
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- namespace:
- type: mixed
- value: '{{#1741161440242.namespace#}}'
- pod:
+ - '1742433446760'
+ - history_et
+ node:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328197695'
+ height: 54
+ id: '17424348206030'
position:
- x: 879.4543026140257
- y: 516.6534783332379
+ x: 1550
+ y: 1369
positionAbsolute:
- x: 879.4543026140257
- y: 516.6534783332379
+ x: 1550
+ y: 1369
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2880,38 +4830,38 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机磁盘使用率(百分比,不含rootfs)
+ title: 历史数据 宿主机IO等待CPU繁忙率
tool_configurations: {}
- tool_label: 宿主机磁盘使用率(百分比,不含rootfs)
- tool_name: 宿主机磁盘使用率(百分比,不含rootfs)
+ tool_label: 宿主机IO等待CPU繁忙率
+ tool_name: host_cpu_iowait
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328213545'
+ height: 54
+ id: '17424348526540'
position:
- x: 897.1352138415443
- y: 617.4421900673747
+ x: 1550
+ y: 1463
positionAbsolute:
- x: 897.1352138415443
- y: 617.4421900673747
+ x: 1550
+ y: 1463
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -2997,38 +4947,86 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机网络接收速率(比特/秒)
+ title: 历史数据 宿主机当前打开文件描述符数
tool_configurations: {}
- tool_label: 宿主机网络接收速率(比特/秒)
- tool_name: 宿主机网络接收速率(比特/秒)
+ tool_label: 宿主机当前打开文件描述符数
+ tool_name: host_cpu_fd_open
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328346220'
+ height: 54
+ id: '17424348570980'
+ position:
+ x: 1550
+ y: 1557
+ positionAbsolute:
+ x: 1550
+ y: 1557
+ selected: false
+ sourcePosition: right
+ targetPosition: left
+ type: custom
+ width: 244
+ - data:
+ code: " \ndef get_value(data, keys): \n for key in keys: \n value = data.get(key)\
+ \ \n if value is not None: \n return value \n return \"\" \n\n\
+ import json \n\ndef main(arg: str) -> dict:\n data = json.loads(arg) \n\
+ \ return { \n \"node\": get_value(data, [\"svc_node\", \"node\", \"nodename\"\
+ ]), \n \"service\": get_value(data, [\"svc_name\", \"service\"]),\
+ \ \n \"endpoint\": get_value(data,[\"endpoint\", \"content_key\"]), \n\
+ \ \"pod\": get_value(data,[\"pod\", \"src_pod\", \"pod_name\"]), \n \"\
+ namespace\": get_value(data,[\"namespace\", \"src_namespace\"]), \n}"
+ code_language: python3
+ desc: ''
+ outputs:
+ endpoint:
+ children: null
+ type: string
+ namespace:
+ children: null
+ type: string
+ node:
+ children: null
+ type: string
+ pod:
+ children: null
+ type: string
+ service:
+ children: null
+ type: string
+ selected: false
+ title: 告警事件标签提取
+ type: code
+ variables:
+ - value_selector:
+ - '1741157526222'
+ - params
+ variable: arg
+ height: 54
+ id: '1742806924635'
position:
- x: 897.1352138415443
- y: 706.3425334205976
+ x: 334
+ y: 560
positionAbsolute:
- x: 897.1352138415443
- y: 706.3425334205976
+ x: 334
+ y: 560
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3038,23 +5036,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3062,16 +5060,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3086,16 +5132,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3107,45 +5153,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机磁盘读取数据速率(字节/秒)
+ title: 容器CPU 使用率
tool_configurations: {}
- tool_label: 宿主机磁盘读取数据速率(字节/秒)
- tool_name: 宿主机磁盘读取数据速率(字节/秒)
+ tool_label: Container CPU usage rate (Containerd runtime, aggregated by container
+ and Pod)
+ tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.namespace#}}'
+ pod:
+ type: mixed
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328423453'
+ height: 54
+ id: '1742979394268'
position:
- x: 909.6690018199924
- y: 807.5848583297699
+ x: 1246
+ y: 1839
positionAbsolute:
- x: 909.6690018199924
- y: 807.5848583297699
+ x: 1246
+ y: 1839
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3155,23 +5207,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3179,16 +5231,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3203,16 +5303,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3224,45 +5324,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机磁盘写入数据速率(字节/秒)
+ title: 容器内存占用
tool_configurations: {}
- tool_label: 宿主机磁盘写入数据速率(字节/秒)
- tool_name: 宿主机磁盘写入数据速率(字节/秒)
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328466394'
+ height: 54
+ id: '1742979595004'
position:
- x: 922.0951827508213
- y: 890.0354967992098
+ x: 1246
+ y: 1933
positionAbsolute:
- x: 922.0951827508213
- y: 890.0354967992098
+ x: 1246
+ y: 1933
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3272,23 +5378,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3296,16 +5402,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3320,16 +5474,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3341,45 +5495,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机CPU繁忙率(百分比)
+ title: 容器内存占用
tool_configurations: {}
- tool_label: 宿主机CPU繁忙率(百分比)
- tool_name: 查询主机CPU利用率
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- '1741157526222'
- endTime
- node:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328692906'
+ height: 54
+ id: '17429797453350'
position:
- x: 1288.1326361010936
- y: 765.9218546549957
+ x: 1246
+ y: 1651
positionAbsolute:
- x: 1288.1326361010936
- y: 765.9218546549957
+ x: 1246
+ y: 1651
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3389,23 +5549,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: node
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3413,16 +5573,64 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ label:
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
+ max: null
+ min: null
+ name: namespace
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3437,16 +5645,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3458,45 +5666,51 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
- node: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机磁盘IO耗时速率
+ title: 历史数据 容器内存占用
tool_configurations: {}
- tool_label: 宿主机磁盘IO耗时速率
- tool_name: 宿主机磁盘IO耗时速率
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
- node:
+ - '1742433446760'
+ - history_et
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328742817'
+ height: 54
+ id: '17429797664440'
position:
- x: 1320.3050732843196
- y: 838.8279382371494
+ x: 1550
+ y: 1651
positionAbsolute:
- x: 1320.3050732843196
- y: 838.8279382371494
+ x: 1550
+ y: 1651
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3506,23 +5720,47 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: Prometheus job name for host metrics
+ ja_JP: Prometheus job name for host metrics
+ pt_BR: Prometheus job name for host metrics
+ zh_Hans: Prometheus任务名称(宿主机指标)
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: Prometheus Job
+ ja_JP: Prometheus Job
+ pt_BR: Tarefa Prometheus
+ zh_Hans: Prometheus任务
+ llm_description: Unique identifier for metrics scrape job
+ max: null
+ min: null
+ name: job
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Host node identifier
+ ja_JP: Host node identifier
+ pt_BR: Host node identifier
+ zh_Hans: 宿主机节点标识
+ label:
+ en_US: Host Node
+ ja_JP: Host Node
+ pt_BR: Host Node
+ zh_Hans: 宿主机节点
+ llm_description: Unique identifier for host node
max: null
min: null
name: node
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3530,16 +5768,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3554,16 +5792,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3576,16 +5814,17 @@ workflow:
type: number
params:
endTime: ''
+ job: ''
node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机IO等待CPU繁忙率
+ title: 宿主机cpu
tool_configurations: {}
- tool_label: 宿主机IO等待CPU繁忙率
- tool_name: host_cpu_iowait
+ tool_label: Query host's CPU pressure
+ tool_name: 查询宿主机CPU压力
tool_parameters:
endTime:
type: variable
@@ -3594,26 +5833,26 @@ workflow:
- endTime
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741328773213'
+ height: 54
+ id: '1742979828391'
position:
- x: 1295.1943032554088
- y: 918.3967184410467
+ x: 1246
+ y: 1745
positionAbsolute:
- x: 1295.1943032554088
- y: 918.3967184410467
+ x: 1246
+ y: 1745
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3623,23 +5862,47 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified host name
- ja_JP: Specified host name
- pt_BR: Specified host name
- zh_Hans: 指定的主机名
+ en_US: Prometheus job name for host metrics
+ ja_JP: Prometheus job name for host metrics
+ pt_BR: Prometheus job name for host metrics
+ zh_Hans: Prometheus任务名称(宿主机指标)
label:
- en_US: node
- ja_JP: node
- pt_BR: node
- zh_Hans: node
- llm_description: Specified host name
+ en_US: Prometheus Job
+ ja_JP: Prometheus Job
+ pt_BR: Tarefa Prometheus
+ zh_Hans: Prometheus任务
+ llm_description: Unique identifier for metrics scrape job
+ max: null
+ min: null
+ name: job
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Host node identifier
+ ja_JP: Host node identifier
+ pt_BR: Host node identifier
+ zh_Hans: 宿主机节点标识
+ label:
+ en_US: Host Node
+ ja_JP: Host Node
+ pt_BR: Host Node
+ zh_Hans: 宿主机节点
+ llm_description: Unique identifier for host node
max: null
min: null
name: node
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3647,16 +5910,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3671,16 +5934,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3693,44 +5956,45 @@ workflow:
type: number
params:
endTime: ''
+ job: ''
node: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 宿主机当前打开文件描述符数
+ title: 历史数据 宿主机cpu
tool_configurations: {}
- tool_label: 宿主机当前打开文件描述符数
- tool_name: host_cpu_fd_open
+ tool_label: Query host's CPU pressure
+ tool_name: 查询宿主机CPU压力
tool_parameters:
endTime:
type: variable
value:
- - '1741157526222'
- - endTime
+ - '1742433446760'
+ - history_et
node:
type: mixed
- value: '{{#1741161440242.node#}}'
+ value: '{{#1742806924635.node#}}'
startTime:
type: variable
value:
- - '1741157526222'
- - startTime
+ - '1742433446760'
+ - history_st
type: tool
- height: 53
- id: '1741328799030'
+ height: 54
+ id: '17429798797920'
position:
- x: 1300.5588170319227
- y: 999.2631864254831
+ x: 1550
+ y: 1745
positionAbsolute:
- x: 1300.5588170319227
- y: 999.2631864254831
+ x: 1550
+ y: 1745
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3740,23 +6004,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified service name
- ja_JP: Specified service name
- pt_BR: Specified service name
- zh_Hans: 指定的服务名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: service_name
- ja_JP: service_name
- pt_BR: service_name
- zh_Hans: service_name
- llm_description: 指定的服务名
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: service_name
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3764,23 +6028,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified endpoint name
- ja_JP: Specified endpoint name
- pt_BR: Specified endpoint name
- zh_Hans: 指定的服务端点名
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: content_key
- ja_JP: content_key
- pt_BR: content_key
- zh_Hans: content_key
- llm_description: 指定的服务端点名
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
- name: content_key
+ name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3788,16 +6052,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3812,16 +6100,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3833,49 +6121,51 @@ workflow:
template: null
type: number
params:
- content_key: ''
+ cadvisor_job_name: ''
endTime: ''
- service_name: ''
+ namespace: ''
+ pod: ''
startTime: ''
provider_id: apo_select
provider_name: apo_select
provider_type: builtin
selected: false
- title: 服务请求成功率(按服务名和内容键统计,指定时间段内)
+ title: '历史数据 容器CPU 使用率 '
tool_configurations: {}
- tool_label: 服务请求成功率(按服务名和内容键统计,指定时间段内)
- tool_name: Originx 北极星指标 (服务层级) - RED指标 - 请求成功率
+ tool_label: Container CPU usage rate (Containerd runtime, aggregated by container
+ and Pod)
+ tool_name: 容器CPU使用率(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
- content_key:
- type: mixed
- value: '{{#1741161440242.endpoint#}}'
endTime:
type: variable
value:
- '1741157526222'
- endTime
- service_name:
+ namespace:
+ type: mixed
+ value: '{{#1742806924635.namespace#}}'
+ pod:
type: mixed
- value: '{{#1741161440242.service#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741329632798'
+ height: 54
+ id: '17429835599060'
position:
- x: 879.4543026140257
- y: 428.59818368333947
+ x: 1550
+ y: 1839
positionAbsolute:
- x: 879.4543026140257
- y: 428.59818368333947
+ x: 1550
+ y: 1839
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
- data:
desc: ''
is_team_authorization: true
@@ -3885,23 +6175,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified pod name
- ja_JP: Specified pod name
- pt_BR: Specified pod name
- zh_Hans: 指定的容器POD名称
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
label:
- en_US: pod
- ja_JP: pod
- pt_BR: pod
- zh_Hans: pod
- llm_description: Specified pod name
+ en_US: cAdvisor job name
+ ja_JP: cAdvisor job name
+ pt_BR: cAdvisor job name
+ zh_Hans: cAdvisor任务名称
+ llm_description: cAdvisor job name
max: null
min: null
- name: pod
+ name: cadvisor_job_name
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3909,23 +6199,23 @@ workflow:
default: null
form: llm
human_description:
- en_US: Specified namespace
- ja_JP: Specified namespace
- pt_BR: Specified namespace
- zh_Hans: 指定的容器所在Namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
label:
- en_US: namespace
- ja_JP: namespace
- pt_BR: namespace
- zh_Hans: namespace
- llm_description: Specified namespace
+ en_US: Namespace
+ ja_JP: Namespace
+ pt_BR: Namespace
+ zh_Hans: 命名空间
+ llm_description: Namespace
max: null
min: null
name: namespace
options: []
placeholder: null
precision: null
- required: true
+ required: false
scope: null
template: null
type: string
@@ -3933,16 +6223,40 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query start time
- ja_JP: Data query start time
- pt_BR: Data query start time
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ label:
+ en_US: Pod name
+ ja_JP: Pod name
+ pt_BR: Pod name
+ zh_Hans: Pod名称
+ llm_description: Pod name
+ max: null
+ min: null
+ name: pod
+ options: []
+ placeholder: null
+ precision: null
+ required: false
+ scope: null
+ template: null
+ type: string
+ - auto_generate: null
+ default: null
+ form: llm
+ human_description:
+ en_US: Data query start time(Microsecond)
+ ja_JP: Data query start time(Microsecond)
+ pt_BR: Data query start time(Microsecond)
zh_Hans: 开始时间 (微秒)
label:
en_US: startTime
ja_JP: startTime
pt_BR: startTime
zh_Hans: startTime
- llm_description: Data query start time
+ llm_description: Data query start time(Microsecond)
max: null
min: null
name: startTime
@@ -3957,16 +6271,16 @@ workflow:
default: null
form: llm
human_description:
- en_US: Data query end time
- ja_JP: Data query end time
- pt_BR: Data query end time
+ en_US: Data query end time(Microsecond)
+ ja_JP: Data query end time(Microsecond)
+ pt_BR: Data query end time(Microsecond)
zh_Hans: 结束时间 (微秒)
label:
en_US: endTime
ja_JP: endTime
pt_BR: endTime
zh_Hans: endTime
- llm_description: Data query start time
+ llm_description: Data query end time(Microsecond)
max: null
min: null
name: endTime
@@ -3978,6 +6292,7 @@ workflow:
template: null
type: number
params:
+ cadvisor_job_name: ''
endTime: ''
namespace: ''
pod: ''
@@ -3986,10 +6301,11 @@ workflow:
provider_name: apo_select
provider_type: builtin
selected: false
- title: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
+ title: 历史数据 容器内存占用
tool_configurations: {}
- tool_label: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
- tool_name: 查询容器内存使用量
+ tool_label: Container memory usage in bytes (Containerd runtime, aggregated
+ by container and Pod)
+ tool_name: 容器内存使用字节数(使用Containerd容器运行时,按容器和Pod统计)
tool_parameters:
endTime:
type: variable
@@ -3998,30 +6314,30 @@ workflow:
- endTime
namespace:
type: mixed
- value: '{{#1741161440242.namespace#}}'
+ value: '{{#1742806924635.namespace#}}'
pod:
type: mixed
- value: '{{#1741161440242.pod#}}'
+ value: '{{#1742806924635.pod#}}'
startTime:
type: variable
value:
- '1741157526222'
- startTime
type: tool
- height: 53
- id: '1741591590829'
+ height: 54
+ id: '17429835940550'
position:
- x: 1106.622658811791
- y: 1100.534952103478
+ x: 1550
+ y: 1933
positionAbsolute:
- x: 1106.622658811791
- y: 1100.534952103478
+ x: 1550
+ y: 1933
selected: false
sourcePosition: right
targetPosition: left
type: custom
- width: 243
+ width: 244
viewport:
- x: 171.57866536216355
- y: 331.8252495324367
- zoom: 0.2578933989536625
+ x: 289.1589008663707
+ y: -174.9404993893893
+ zoom: 0.5537771915449453
diff --git a/api/initializer/plugin.py b/api/initializer/plugin.py
index 1a753dfbfc..f2c4da0770 100644
--- a/api/initializer/plugin.py
+++ b/api/initializer/plugin.py
@@ -30,6 +30,7 @@ def init_plugin():
try:
with open(file_entry.path, 'rb') as file:
+
file_size = os.fstat(file.fileno()).st_size
if file_size > dify_config.PLUGIN_MAX_PACKAGE_SIZE:
logging.error(f"File size exceeds the limit: {file_entry.path}")