Compare commits


2 Commits

SHA1        Message                                        Date
5f7771bc47  fix: iteration node use the main thread pool   2024-12-02 21:13:47 +08:00
286741e139  fix: iteration node use the main thread pool   2024-12-02 21:13:39 +08:00
193 changed files with 1974 additions and 4824 deletions

View File

@ -413,3 +413,4 @@ RESET_PASSWORD_TOKEN_EXPIRY_MINUTES=5
CREATE_TIDB_SERVICE_JOB_ENABLED=false
RETRIEVAL_TOP_N=0

View File

@ -20,8 +20,6 @@ select = [
"PLC0208", # iteration-over-set
"PLC2801", # unnecessary-dunder-call
"PLC0414", # useless-import-alias
"PLE0604", # invalid-all-object
"PLE0605", # invalid-all-format
"PLR0402", # manual-from-import
"PLR1711", # useless-return
"PLR1714", # repeated-equality-comparison
@ -30,7 +28,6 @@ select = [
"RUF100", # unused-noqa
"RUF101", # redirected-noqa
"RUF200", # invalid-pyproject-toml
"RUF022", # unsorted-dunder-all
"S506", # unsafe-yaml-load
"SIM", # flake8-simplify rules
"TRY400", # error-instead-of-exception

View File

@ -259,7 +259,7 @@ def migrate_knowledge_vector_database():
skipped_count = 0
total_count = 0
vector_type = dify_config.VECTOR_STORE
upper_collection_vector_types = {
upper_colletion_vector_types = {
VectorType.MILVUS,
VectorType.PGVECTOR,
VectorType.RELYT,
@ -267,7 +267,7 @@ def migrate_knowledge_vector_database():
VectorType.ORACLE,
VectorType.ELASTICSEARCH,
}
lower_collection_vector_types = {
lower_colletion_vector_types = {
VectorType.ANALYTICDB,
VectorType.CHROMA,
VectorType.MYSCALE,
@ -307,7 +307,7 @@ def migrate_knowledge_vector_database():
continue
collection_name = ""
dataset_id = dataset.id
if vector_type in upper_collection_vector_types:
if vector_type in upper_colletion_vector_types:
collection_name = Dataset.gen_collection_name_by_id(dataset_id)
elif vector_type == VectorType.QDRANT:
if dataset.collection_binding_id:
@ -323,7 +323,7 @@ def migrate_knowledge_vector_database():
else:
collection_name = Dataset.gen_collection_name_by_id(dataset_id)
elif vector_type in lower_collection_vector_types:
elif vector_type in lower_colletion_vector_types:
collection_name = Dataset.gen_collection_name_by_id(dataset_id).lower()
else:
raise ValueError(f"Vector store {vector_type} is not supported.")

View File

@ -626,6 +626,8 @@ class DataSetConfig(BaseSettings):
default=30,
)
RETRIEVAL_TOP_N: int = Field(description="number of retrieval top_n", default=0)
class WorkspaceConfig(BaseSettings):
"""

View File

@ -9,7 +9,7 @@ class PackagingInfo(BaseSettings):
CURRENT_VERSION: str = Field(
description="Dify version",
default="0.13.1",
default="0.12.1",
)
COMMIT_SHA: str = Field(

View File

@ -100,11 +100,11 @@ class DraftWorkflowApi(Resource):
try:
environment_variables_list = args.get("environment_variables") or []
environment_variables = [
variable_factory.build_environment_variable_from_mapping(obj) for obj in environment_variables_list
variable_factory.build_variable_from_mapping(obj) for obj in environment_variables_list
]
conversation_variables_list = args.get("conversation_variables") or []
conversation_variables = [
variable_factory.build_conversation_variable_from_mapping(obj) for obj in conversation_variables_list
variable_factory.build_variable_from_mapping(obj) for obj in conversation_variables_list
]
workflow = workflow_service.sync_draft_workflow(
app_model=app_model,
@ -382,7 +382,7 @@ class DefaultBlockConfigApi(Resource):
filters = None
if args.get("q"):
try:
filters = json.loads(args.get("q", ""))
filters = json.loads(args.get("q"))
except json.JSONDecodeError:
raise ValueError("Invalid filters")

View File

@ -2,7 +2,7 @@
Due to the presence of tasks in App Runner that require long execution times, such as LLM generation and external requests, Flask-Sqlalchemy's strategy for database connection pooling is to allocate one connection (transaction) per request. This approach keeps a connection occupied even during non-DB tasks, leading to the inability to acquire new connections during high concurrency requests due to multiple long-running tasks.
Therefore, the database operations in App Runner and Task Pipeline must ensure connections are closed immediately after use, and it's better to pass IDs rather than Model objects to avoid detach errors.
Therefore, the database operations in App Runner and Task Pipeline must ensure connections are closed immediately after use, and it's better to pass IDs rather than Model objects to avoid deattach errors.
Examples:
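The hunk cuts off at "Examples:"; as a stand-in, here is a minimal sketch of the pattern just described (illustrative only — `App` is borrowed from an import elsewhere in this diff, and the attribute access is assumed):

```python
from extensions.ext_database import db
from models.model import App

def load_app_name(app_id: str) -> str:
    # do the DB read, keep only plain data, then release the connection
    app = db.session.query(App).filter(App.id == app_id).first()
    name = app.name if app else ""
    db.session.close()  # return the connection to the pool before slow work
    return name

# Pass the id (a str), not the App model object, into long-running tasks,
# so no detached-instance error occurs once the session is gone.
```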

View File

@ -43,7 +43,7 @@ from core.workflow.graph_engine.entities.event import (
)
from core.workflow.graph_engine.entities.graph import Graph
from core.workflow.nodes import NodeType
from core.workflow.nodes.node_mapping import NODE_TYPE_CLASSES_MAPPING
from core.workflow.nodes.node_mapping import node_type_classes_mapping
from core.workflow.workflow_entry import WorkflowEntry
from extensions.ext_database import db
from models.model import App
@ -138,8 +138,7 @@ class WorkflowBasedAppRunner(AppRunner):
# Get node class
node_type = NodeType(iteration_node_config.get("data", {}).get("type"))
node_version = iteration_node_config.get("data", {}).get("version", "1")
node_cls = NODE_TYPE_CLASSES_MAPPING[node_type][node_version]
node_cls = node_type_classes_mapping[node_type]
# init variable pool
variable_pool = VariablePool(

View File

@ -7,13 +7,13 @@ from .models import (
)
__all__ = [
"FILE_MODEL_IDENTITY",
"ArrayFileAttribute",
"File",
"FileAttribute",
"FileBelongsTo",
"FileTransferMethod",
"FileType",
"FileUploadConfig",
"FileTransferMethod",
"FileBelongsTo",
"File",
"ImageConfig",
"FileAttribute",
"ArrayFileAttribute",
"FILE_MODEL_IDENTITY",
]

View File

@ -91,7 +91,7 @@ class XinferenceProvider(Provider):
"""
```
也可以直接抛出对应 Errors并做如下定义这样在之后的调用中可以直接抛出`InvokeConnectionError`等异常。
也可以直接抛出对应Erros并做如下定义这样在之后的调用中可以直接抛出`InvokeConnectionError`等异常。
```python
@property

View File

@ -18,25 +18,25 @@ from .message_entities import (
from .model_entities import ModelPropertyKey
__all__ = [
"AssistantPromptMessage",
"AudioPromptMessageContent",
"DocumentPromptMessageContent",
"ImagePromptMessageContent",
"VideoPromptMessageContent",
"PromptMessage",
"PromptMessageRole",
"LLMUsage",
"ModelPropertyKey",
"AssistantPromptMessage",
"PromptMessage",
"PromptMessageContent",
"PromptMessageRole",
"SystemPromptMessage",
"TextPromptMessageContent",
"UserPromptMessage",
"PromptMessageTool",
"ToolPromptMessage",
"PromptMessageContentType",
"LLMResult",
"LLMResultChunk",
"LLMResultChunkDelta",
"LLMUsage",
"ModelPropertyKey",
"PromptMessage",
"PromptMessage",
"PromptMessageContent",
"PromptMessageContentType",
"PromptMessageRole",
"PromptMessageRole",
"PromptMessageTool",
"SystemPromptMessage",
"TextPromptMessageContent",
"ToolPromptMessage",
"UserPromptMessage",
"VideoPromptMessageContent",
"AudioPromptMessageContent",
"DocumentPromptMessageContent",
]

View File

@ -16,7 +16,6 @@ help:
supported_model_types:
- llm
- text-embedding
- rerank
configurate_methods:
- predefined-model
provider_credential_schema:

View File

@ -1,52 +0,0 @@
model: amazon.nova-lite-v1:0
label:
en_US: Nova Lite V1
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 300000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.00006'
output: '0.00024'
unit: '0.001'
currency: USD

View File

@ -1,52 +0,0 @@
model: amazon.nova-micro-v1:0
label:
en_US: Nova Micro V1
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 128000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.000035'
output: '0.00014'
unit: '0.001'
currency: USD

View File

@ -1,52 +0,0 @@
model: amazon.nova-pro-v1:0
label:
en_US: Nova Pro V1
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 300000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.0008'
output: '0.0032'
unit: '0.001'
currency: USD

View File

@ -70,8 +70,6 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
{"prefix": "cohere.command-r", "support_system_prompts": True, "support_tool_use": True},
{"prefix": "amazon.titan", "support_system_prompts": False, "support_tool_use": False},
{"prefix": "ai21.jamba-1-5", "support_system_prompts": True, "support_tool_use": False},
{"prefix": "amazon.nova", "support_system_prompts": True, "support_tool_use": False},
{"prefix": "us.amazon.nova", "support_system_prompts": True, "support_tool_use": False},
]
@staticmethod
@ -196,13 +194,6 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
if model_info["support_tool_use"] and tools:
parameters["toolConfig"] = self._convert_converse_tool_config(tools=tools)
try:
# for issue #10976
conversations_list = parameters["messages"]
# if two consecutive user messages found, combine them into one message
for i in range(len(conversations_list) - 2, -1, -1):
if conversations_list[i]["role"] == conversations_list[i + 1]["role"]:
conversations_list[i]["content"].extend(conversations_list.pop(i + 1)["content"])
if stream:
response = bedrock_client.converse_stream(**parameters)
return self._handle_converse_stream_response(
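The merge loop removed above can be exercised standalone; a small demonstration with sample messages in the converse format:

```python
conversations_list = [
    {"role": "user", "content": [{"text": "first"}]},
    {"role": "user", "content": [{"text": "second"}]},
    {"role": "assistant", "content": [{"text": "reply"}]},
]
# Walk backwards so pops don't disturb unvisited indices.
for i in range(len(conversations_list) - 2, -1, -1):
    if conversations_list[i]["role"] == conversations_list[i + 1]["role"]:
        conversations_list[i]["content"].extend(conversations_list.pop(i + 1)["content"])

print(conversations_list)
# [{'role': 'user', 'content': [{'text': 'first'}, {'text': 'second'}]},
#  {'role': 'assistant', 'content': [{'text': 'reply'}]}]
```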

View File

@ -1,52 +0,0 @@
model: us.amazon.nova-lite-v1:0
label:
en_US: Nova Lite V1 (US.Cross Region Inference)
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 300000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.00006'
output: '0.00024'
unit: '0.001'
currency: USD

View File

@ -1,52 +0,0 @@
model: us.amazon.nova-micro-v1:0
label:
en_US: Nova Micro V1 (US.Cross Region Inference)
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 128000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.000035'
output: '0.00014'
unit: '0.001'
currency: USD

View File

@ -1,52 +0,0 @@
model: us.amazon.nova-pro-v1:0
label:
en_US: Nova Pro V1 (US.Cross Region Inference)
model_type: llm
features:
- agent-thought
- tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 300000
parameter_rules:
- name: max_new_tokens
use_template: max_tokens
required: true
default: 2048
min: 1
max: 5000
- name: temperature
use_template: temperature
required: false
type: float
default: 1
min: 0.0
max: 1.0
help:
zh_Hans: 生成内容的随机性。
en_US: The amount of randomness injected into the response.
- name: top_p
required: false
type: float
default: 0.999
min: 0.000
max: 1.000
help:
zh_Hans: 在核采样中Anthropic Claude 按概率递减顺序计算每个后续标记的所有选项的累积分布,并在达到 top_p 指定的特定概率时将其切断。您应该更改温度或top_p但不能同时更改两者。
en_US: In nucleus sampling, Anthropic Claude computes the cumulative distribution over all the options for each subsequent token in decreasing probability order and cuts it off once it reaches a particular probability specified by top_p. You should alter either temperature or top_p, but not both.
- name: top_k
required: false
type: int
default: 0
min: 0
# tip docs from aws has error, max value is 500
max: 500
help:
zh_Hans: 对于每个后续标记,仅从前 K 个选项中进行采样。使用 top_k 删除长尾低概率响应。
en_US: Only sample from the top K options for each subsequent token. Use top_k to remove long tail low probability responses.
pricing:
input: '0.0008'
output: '0.0032'
unit: '0.001'
currency: USD

View File

@ -1,2 +0,0 @@
- amazon.rerank-v1
- cohere.rerank-v3-5

View File

@ -1,4 +0,0 @@
model: amazon.rerank-v1:0
model_type: rerank
model_properties:
context_size: 5120

View File

@ -1,4 +0,0 @@
model: cohere.rerank-v3-5:0
model_type: rerank
model_properties:
context_size: 5120

View File

@ -1,147 +0,0 @@
from typing import Optional
import boto3
from botocore.config import Config
from core.model_runtime.entities.rerank_entities import RerankDocument, RerankResult
from core.model_runtime.errors.invoke import (
InvokeAuthorizationError,
InvokeBadRequestError,
InvokeConnectionError,
InvokeError,
InvokeRateLimitError,
InvokeServerUnavailableError,
)
from core.model_runtime.errors.validate import CredentialsValidateFailedError
from core.model_runtime.model_providers.__base.rerank_model import RerankModel
class BedrockRerankModel(RerankModel):
"""
Model class for Cohere rerank model.
"""
def _invoke(
self,
model: str,
credentials: dict,
query: str,
docs: list[str],
score_threshold: Optional[float] = None,
top_n: Optional[int] = None,
user: Optional[str] = None,
) -> RerankResult:
"""
Invoke rerank model
:param model: model name
:param credentials: model credentials
:param query: search query
:param docs: docs for reranking
:param score_threshold: score threshold
:param top_n: top n
:param user: unique user id
:return: rerank result
"""
if len(docs) == 0:
return RerankResult(model=model, docs=docs)
# initialize client
client_config = Config(region_name=credentials["aws_region"])
bedrock_runtime = boto3.client(
service_name="bedrock-agent-runtime",
config=client_config,
aws_access_key_id=credentials.get("aws_access_key_id", ""),
aws_secret_access_key=credentials.get("aws_secret_access_key"),
)
queries = [{"type": "TEXT", "textQuery": {"text": query}}]
text_sources = []
for text in docs:
text_sources.append(
{
"type": "INLINE",
"inlineDocumentSource": {
"type": "TEXT",
"textDocument": {
"text": text,
},
},
}
)
modelId = model
region = credentials["aws_region"]
model_package_arn = f"arn:aws:bedrock:{region}::foundation-model/{modelId}"
rerankingConfiguration = {
"type": "BEDROCK_RERANKING_MODEL",
"bedrockRerankingConfiguration": {
"numberOfResults": top_n,
"modelConfiguration": {
"modelArn": model_package_arn,
},
},
}
response = bedrock_runtime.rerank(
queries=queries, sources=text_sources, rerankingConfiguration=rerankingConfiguration
)
rerank_documents = []
for idx, result in enumerate(response["results"]):
# format document
index = result["index"]
rerank_document = RerankDocument(
index=index,
text=docs[index],
score=result["relevanceScore"],
)
# score threshold check
if score_threshold is not None:
if rerank_document.score >= score_threshold:
rerank_documents.append(rerank_document)
else:
rerank_documents.append(rerank_document)
return RerankResult(model=model, docs=rerank_documents)
def validate_credentials(self, model: str, credentials: dict) -> None:
"""
Validate model credentials
:param model: model name
:param credentials: model credentials
:return:
"""
try:
self.invoke(
model=model,
credentials=credentials,
query="What is the capital of the United States?",
docs=[
"Carson City is the capital city of the American state of Nevada. At the 2010 United States "
"Census, Carson City had a population of 55,274.",
"The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that "
"are a political division controlled by the United States. Its capital is Saipan.",
],
score_threshold=0.8,
)
except Exception as ex:
raise CredentialsValidateFailedError(str(ex))
@property
def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
"""
Map model invoke error to unified error
The key is the ermd = genai.GenerativeModel(model) error type thrown to the caller
The value is the md = genai.GenerativeModel(model) error type thrown by the model,
which needs to be converted into a unified error type for the caller.
:return: Invoke emd = genai.GenerativeModel(model) error mapping
"""
return {
InvokeConnectionError: [],
InvokeServerUnavailableError: [],
InvokeRateLimitError: [],
InvokeAuthorizationError: [],
InvokeBadRequestError: [],
}

View File

@ -252,7 +252,7 @@ class MoonshotLargeLanguageModel(OAIAPICompatLargeLanguageModel):
# ignore sse comments
if chunk.startswith(":"):
continue
decoded_chunk = chunk.strip().removeprefix("data: ")
decoded_chunk = chunk.strip().lstrip("data: ").lstrip()
chunk_json = None
try:
chunk_json = json.loads(decoded_chunk)
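The `removeprefix`/`lstrip` swap above (which recurs in the next two files) is not cosmetic: `str.lstrip("data: ")` strips any leading run of the characters {'d', 'a', 't', ':', ' '}, whereas `str.removeprefix("data: ")` (Python 3.9+) removes the exact prefix at most once. A demonstration:

```python
chunk = "data: task_done"
print(chunk.lstrip("data: "))        # 'sk_done'  — keeps eating the leading 't', 'a'
print(chunk.removeprefix("data: "))  # 'task_done'
```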

View File

@ -462,7 +462,7 @@ class OAIAPICompatLargeLanguageModel(_CommonOaiApiCompat, LargeLanguageModel):
# ignore sse comments
if chunk.startswith(":"):
continue
decoded_chunk = chunk.strip().removeprefix("data: ")
decoded_chunk = chunk.strip().lstrip("data: ").lstrip()
if decoded_chunk == "[DONE]": # Some provider returns "data: [DONE]"
continue

View File

@ -250,7 +250,7 @@ class StepfunLargeLanguageModel(OAIAPICompatLargeLanguageModel):
# ignore sse comments
if chunk.startswith(":"):
continue
decoded_chunk = chunk.strip().removeprefix("data: ")
decoded_chunk = chunk.strip().lstrip("data: ").lstrip()
chunk_json = None
try:
chunk_json = json.loads(decoded_chunk)

View File

@ -1,4 +1,4 @@
from .common import ChatRole
from .maas import MaasError, MaasService
__all__ = ["ChatRole", "MaasError", "MaasService"]
__all__ = ["MaasService", "ChatRole", "MaasError"]

View File

@ -17,13 +17,7 @@ class WenxinRerank(_CommonWenxin):
def rerank(self, model: str, query: str, docs: list[str], top_n: Optional[int] = None):
access_token = self._get_access_token()
url = f"{self.api_bases[model]}?access_token={access_token}"
# For issue #11252
# for wenxin Rerank model top_n length should be equal or less than docs length
if top_n is not None and top_n > len(docs):
top_n = len(docs)
# for wenxin Rerank model, query should not be an empty string
if query == "":
query = " " # FIXME: this is a workaround for wenxin rerank model for better user experience.
try:
response = httpx.post(
url,
@ -31,11 +25,7 @@ class WenxinRerank(_CommonWenxin):
headers={"Content-Type": "application/json"},
)
response.raise_for_status()
data = response.json()
# wenxin error handling
if "error_code" in data:
raise InternalServerError(data["error_msg"])
return data
return response.json()
except httpx.HTTPStatusError as e:
raise InternalServerError(str(e))
@ -79,9 +69,6 @@ class WenxinRerankModel(RerankModel):
results = wenxin_rerank.rerank(model, query, docs, top_n)
rerank_documents = []
if "results" not in results:
raise ValueError("results key not found in response")
for result in results["results"]:
index = result["index"]
if "document" in result:

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 8192
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,7 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 1048576
context_size: 10240
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -8,7 +8,6 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature

View File

@ -4,7 +4,6 @@ label:
model_type: llm
model_properties:
mode: chat
context_size: 2048
features:
- vision
parameter_rules:

View File

@ -4,7 +4,6 @@ label:
model_type: llm
model_properties:
mode: chat
context_size: 8192
features:
- vision
- video

View File

@ -22,6 +22,18 @@ from core.model_runtime.model_providers.__base.large_language_model import Large
from core.model_runtime.model_providers.zhipuai._common import _CommonZhipuaiAI
from core.model_runtime.utils import helper
GLM_JSON_MODE_PROMPT = """You should always follow the instructions and output a valid JSON object.
The structure of the JSON object you can found in the instructions, use {"answer": "$your_answer"} as the default structure
if you are not sure about the structure.
And you should always end the block with a "```" to indicate the end of the JSON object.
<instructions>
{{instructions}}
</instructions>
```JSON""" # noqa: E501
class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
def _invoke(
@ -52,8 +64,42 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
credentials_kwargs = self._to_credential_kwargs(credentials)
# invoke model
# stop = stop or []
# self._transform_json_prompts(model, credentials, prompt_messages, model_parameters, tools, stop, stream, user)
return self._generate(model, credentials_kwargs, prompt_messages, model_parameters, tools, stop, stream, user)
# def _transform_json_prompts(self, model: str, credentials: dict,
# prompt_messages: list[PromptMessage], model_parameters: dict,
# tools: list[PromptMessageTool] | None = None, stop: list[str] | None = None,
# stream: bool = True, user: str | None = None) \
# -> None:
# """
# Transform json prompts to model prompts
# """
# if "}\n\n" not in stop:
# stop.append("}\n\n")
# # check if there is a system message
# if len(prompt_messages) > 0 and isinstance(prompt_messages[0], SystemPromptMessage):
# # override the system message
# prompt_messages[0] = SystemPromptMessage(
# content=GLM_JSON_MODE_PROMPT.replace("{{instructions}}", prompt_messages[0].content)
# )
# else:
# # insert the system message
# prompt_messages.insert(0, SystemPromptMessage(
# content=GLM_JSON_MODE_PROMPT.replace("{{instructions}}", "Please output a valid JSON object.")
# ))
# # check if the last message is a user message
# if len(prompt_messages) > 0 and isinstance(prompt_messages[-1], UserPromptMessage):
# # add ```JSON\n to the last message
# prompt_messages[-1].content += "\n```JSON\n"
# else:
# # append a user message
# prompt_messages.append(UserPromptMessage(
# content="```JSON\n"
# ))
def get_num_tokens(
self,
model: str,
@ -124,7 +170,7 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
:return: full response or stream response chunk generator result
"""
extra_model_kwargs = {}
# request to glm-4v-plus with stop words will always respond "finish_reason":"network_error"
# request to glm-4v-plus with stop words will always response "finish_reason":"network_error"
if stop and model != "glm-4v-plus":
extra_model_kwargs["stop"] = stop
@ -140,7 +186,7 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
# resolve zhipuai model not support system message and user message, assistant message must be in sequence
new_prompt_messages: list[PromptMessage] = []
for prompt_message in prompt_messages:
copy_prompt_message = prompt_message.model_copy()
copy_prompt_message = prompt_message.copy()
if copy_prompt_message.role in {PromptMessageRole.USER, PromptMessageRole.SYSTEM, PromptMessageRole.TOOL}:
if isinstance(copy_prompt_message.content, list):
# check if model is 'glm-4v'
@ -192,38 +238,59 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
params = self._construct_glm_4v_parameter(model, new_prompt_messages, model_parameters)
else:
params = {"model": model, "messages": [], **model_parameters}
for prompt_message in new_prompt_messages:
if prompt_message.role == PromptMessageRole.TOOL:
params["messages"].append(
{
"role": "tool",
"content": prompt_message.content,
"tool_call_id": prompt_message.tool_call_id,
}
)
elif isinstance(prompt_message, AssistantPromptMessage):
if prompt_message.tool_calls:
# glm model
if not model.startswith("chatglm"):
for prompt_message in new_prompt_messages:
if prompt_message.role == PromptMessageRole.TOOL:
params["messages"].append(
{
"role": "assistant",
"role": "tool",
"content": prompt_message.content,
"tool_calls": [
{
"id": tool_call.id,
"type": tool_call.type,
"function": {
"name": tool_call.function.name,
"arguments": tool_call.function.arguments,
},
}
for tool_call in prompt_message.tool_calls
],
"tool_call_id": prompt_message.tool_call_id,
}
)
elif isinstance(prompt_message, AssistantPromptMessage):
if prompt_message.tool_calls:
params["messages"].append(
{
"role": "assistant",
"content": prompt_message.content,
"tool_calls": [
{
"id": tool_call.id,
"type": tool_call.type,
"function": {
"name": tool_call.function.name,
"arguments": tool_call.function.arguments,
},
}
for tool_call in prompt_message.tool_calls
],
}
)
else:
params["messages"].append({"role": "assistant", "content": prompt_message.content})
else:
params["messages"].append({"role": "assistant", "content": prompt_message.content})
else:
params["messages"].append({"role": prompt_message.role.value, "content": prompt_message.content})
params["messages"].append(
{"role": prompt_message.role.value, "content": prompt_message.content}
)
else:
# chatglm model
for prompt_message in new_prompt_messages:
# merge system message to user message
if prompt_message.role in {
PromptMessageRole.SYSTEM,
PromptMessageRole.TOOL,
PromptMessageRole.USER,
}:
if len(params["messages"]) > 0 and params["messages"][-1]["role"] == "user":
params["messages"][-1]["content"] += "\n\n" + prompt_message.content
else:
params["messages"].append({"role": "user", "content": prompt_message.content})
else:
params["messages"].append(
{"role": prompt_message.role.value, "content": prompt_message.content}
)
if tools and len(tools) > 0:
params["tools"] = [{"type": "function", "function": helper.dump_model(tool)} for tool in tools]
@ -339,7 +406,7 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
Handle llm stream response
:param model: model name
:param responses: response
:param response: response
:param prompt_messages: prompt messages
:return: llm response chunk generator result
"""
@ -438,7 +505,7 @@ class ZhipuAILargeLanguageModel(_CommonZhipuaiAI, LargeLanguageModel):
if tools and len(tools) > 0:
text += "\n\nTools:"
for tool in tools:
text += f"\n{tool.model_dump_json()}"
text += f"\n{tool.json()}"
# trim off the trailing ' ' that might come from the "Assistant: "
return text.rstrip()
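Several swaps in this file (`model_copy` → `copy`, `model_dump_json` → `json`) trade Pydantic v2 method names for their deprecated v1 spellings. For reference, a minimal sketch of the correspondence:

```python
from pydantic import BaseModel

class Tool(BaseModel):
    name: str

tool = Tool(name="search")
tool.model_copy()       # Pydantic v2 name (v1: tool.copy())
tool.model_dump_json()  # Pydantic v2 name (v1: tool.json())
tool.model_dump()       # Pydantic v2 name (v1: tool.dict())
```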

View File

@ -5,7 +5,7 @@ BAICHUAN_CONTEXT = "用户在与一个客观的助手对话。助手会尊重找
CHAT_APP_COMPLETION_PROMPT_CONFIG = {
"completion_prompt_config": {
"prompt": {
"text": "{{#pre_prompt#}}\nHere are the chat histories between human and assistant, inside <histories></histories> XML tags.\n\n<histories>\n{{#histories#}}\n</histories>\n\n\nHuman: {{#query#}}\n\nAssistant: " # noqa: E501
"text": "{{#pre_prompt#}}\nHere is the chat histories between human and assistant, inside <histories></histories> XML tags.\n\n<histories>\n{{#histories#}}\n</histories>\n\n\nHuman: {{#query#}}\n\nAssistant: " # noqa: E501
},
"conversation_histories_role": {"user_prefix": "Human", "assistant_prefix": "Assistant"},
},

View File

@ -3,6 +3,7 @@ from typing import Optional
from flask import Flask, current_app
from configs import DifyConfig
from core.rag.data_post_processor.data_post_processor import DataPostProcessor
from core.rag.datasource.keyword.keyword_factory import Keyword
from core.rag.datasource.vdb.vector_factory import Vector
@ -113,7 +114,7 @@ class RetrievalService:
query=query,
documents=all_documents,
score_threshold=score_threshold,
top_n=top_k,
top_n=DifyConfig.RETRIEVAL_TOP_N or top_k,
)
return all_documents
@ -185,7 +186,7 @@ class RetrievalService:
query=query,
documents=documents,
score_threshold=score_threshold,
top_n=len(documents),
top_n=DifyConfig.RETRIEVAL_TOP_N or len(documents),
)
)
else:
@ -230,7 +231,7 @@ class RetrievalService:
query=query,
documents=documents,
score_threshold=score_threshold,
top_n=len(documents),
top_n=DifyConfig.RETRIEVAL_TOP_N or len(documents),
)
)
else:
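Because `RETRIEVAL_TOP_N` defaults to 0 (see the DataSetConfig hunk earlier), the `or` fallback added above only overrides `top_k` or `len(documents)` when the setting is explicitly positive:

```python
RETRIEVAL_TOP_N = 0   # the default from DataSetConfig
top_k = 4
print(RETRIEVAL_TOP_N or top_k)  # 4 — falsy 0 falls through to top_k

RETRIEVAL_TOP_N = 10  # explicitly configured
print(RETRIEVAL_TOP_N or top_k)  # 10
```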

View File

@ -104,7 +104,8 @@ class OceanBaseVector(BaseVector):
val = int(row[6])
vals.append(val)
if len(vals) == 0:
raise ValueError("ob_vector_memory_limit_percentage not found in parameters.")
print("ob_vector_memory_limit_percentage not found in parameters.")
exit(1)
if any(val == 0 for val in vals):
try:
self._client.perform_raw_text_sql("ALTER SYSTEM SET ob_vector_memory_limit_percentage = 30")
@ -199,10 +200,10 @@ class OceanBaseVectorFactory(AbstractVectorFactory):
return OceanBaseVector(
collection_name,
OceanBaseVectorConfig(
host=dify_config.OCEANBASE_VECTOR_HOST or "",
port=dify_config.OCEANBASE_VECTOR_PORT or 0,
user=dify_config.OCEANBASE_VECTOR_USER or "",
host=dify_config.OCEANBASE_VECTOR_HOST,
port=dify_config.OCEANBASE_VECTOR_PORT,
user=dify_config.OCEANBASE_VECTOR_USER,
password=(dify_config.OCEANBASE_VECTOR_PASSWORD or ""),
database=dify_config.OCEANBASE_VECTOR_DATABASE or "",
database=dify_config.OCEANBASE_VECTOR_DATABASE,
),
)

View File

@ -375,6 +375,7 @@ class TidbOnQdrantVector(BaseVector):
for result in results:
if result:
document = self._document_from_scored_point(result, Field.CONTENT_KEY.value, Field.METADATA_KEY.value)
document.metadata["vector"] = result.vector
documents.append(document)
return documents
@ -393,7 +394,6 @@ class TidbOnQdrantVector(BaseVector):
) -> Document:
return Document(
page_content=scored_point.payload.get(content_payload_key),
vector=scored_point.vector,
metadata=scored_point.payload.get(metadata_payload_key) or {},
)

View File

@ -15,7 +15,7 @@ class ComfyUIProvider(BuiltinToolProviderController):
try:
ws.connect(ws_address)
except Exception as e:
except Exception:
raise ToolProviderCredentialValidationError(f"can not connect to {ws_address}")
finally:
ws.close()

View File

@ -6,9 +6,9 @@ identity:
zh_Hans: GitLab 合并请求查询
description:
human:
en_US: A tool for query GitLab merge requests, Input should be a exists repository or branch.
en_US: A tool for query GitLab merge requests, Input should be a exists reposity or branch.
zh_Hans: 一个用于查询 GitLab 代码合并请求的工具,输入的内容应该是一个已存在的仓库名或者分支。
llm: A tool for query GitLab merge requests, Input should be a exists repository or branch.
llm: A tool for query GitLab merge requests, Input should be a exists reposity or branch.
parameters:
- name: repository
type: string

View File

@ -61,7 +61,7 @@ class WolframAlphaTool(BuiltinTool):
params["input"] = query
else:
finished = True
if "sources" in response_data["queryresult"]:
if "souces" in response_data["queryresult"]:
return self.create_link_message(response_data["queryresult"]["sources"]["url"])
elif "pods" in response_data["queryresult"]:
result = response_data["queryresult"]["pods"][0]["subpods"][0]["plaintext"]

View File

@ -32,32 +32,32 @@ from .variables import (
)
__all__ = [
"ArrayAnySegment",
"ArrayAnyVariable",
"ArrayFileSegment",
"ArrayFileVariable",
"ArrayNumberSegment",
"ArrayNumberVariable",
"ArrayObjectSegment",
"ArrayObjectVariable",
"ArraySegment",
"ArrayStringSegment",
"ArrayStringVariable",
"FileSegment",
"FileVariable",
"FloatSegment",
"FloatVariable",
"IntegerSegment",
"IntegerVariable",
"NoneSegment",
"NoneVariable",
"ObjectSegment",
"FloatVariable",
"ObjectVariable",
"SecretVariable",
"Segment",
"SegmentGroup",
"SegmentType",
"StringSegment",
"StringVariable",
"ArrayAnyVariable",
"Variable",
"SegmentType",
"SegmentGroup",
"Segment",
"NoneSegment",
"NoneVariable",
"IntegerSegment",
"FloatSegment",
"ObjectSegment",
"ArrayAnySegment",
"StringSegment",
"ArrayStringVariable",
"ArrayNumberVariable",
"ArrayObjectVariable",
"ArraySegment",
"ArrayFileSegment",
"ArrayNumberSegment",
"ArrayObjectSegment",
"ArrayStringSegment",
"FileSegment",
"FileVariable",
"ArrayFileVariable",
]

View File

@ -2,19 +2,16 @@ from enum import StrEnum
class SegmentType(StrEnum):
NONE = "none"
NUMBER = "number"
STRING = "string"
OBJECT = "object"
SECRET = "secret"
FILE = "file"
ARRAY_ANY = "array[any]"
ARRAY_STRING = "array[string]"
ARRAY_NUMBER = "array[number]"
ARRAY_OBJECT = "array[object]"
OBJECT = "object"
FILE = "file"
ARRAY_FILE = "array[file]"
NONE = "none"
GROUP = "group"

View File

@ -2,6 +2,6 @@ from .base_workflow_callback import WorkflowCallback
from .workflow_logging_callback import WorkflowLoggingCallback
__all__ = [
"WorkflowCallback",
"WorkflowLoggingCallback",
"WorkflowCallback",
]

View File

@ -38,7 +38,7 @@ from core.workflow.nodes.answer.answer_stream_processor import AnswerStreamProce
from core.workflow.nodes.base import BaseNode
from core.workflow.nodes.end.end_stream_processor import EndStreamProcessor
from core.workflow.nodes.event import RunCompletedEvent, RunRetrieverResourceEvent, RunStreamChunkEvent
from core.workflow.nodes.node_mapping import NODE_TYPE_CLASSES_MAPPING
from core.workflow.nodes.node_mapping import node_type_classes_mapping
from extensions.ext_database import db
from models.enums import UserFrom
from models.workflow import WorkflowNodeExecutionStatus, WorkflowType
@ -227,8 +227,7 @@ class GraphEngine:
# convert to specific node
node_type = NodeType(node_config.get("data", {}).get("type"))
node_version = node_config.get("data", {}).get("version", "1")
node_cls = NODE_TYPE_CLASSES_MAPPING[node_type][node_version]
node_cls = node_type_classes_mapping[node_type]
previous_node_id = previous_route_node_state.node_id if previous_route_node_state else None

View File

@ -1,4 +1,4 @@
from .answer_node import AnswerNode
from .entities import AnswerStreamGenerateRoute
__all__ = ["AnswerNode", "AnswerStreamGenerateRoute"]
__all__ = ["AnswerStreamGenerateRoute", "AnswerNode"]

View File

@ -153,7 +153,7 @@ class AnswerStreamGeneratorRouter:
NodeType.IF_ELSE,
NodeType.QUESTION_CLASSIFIER,
NodeType.ITERATION,
NodeType.VARIABLE_ASSIGNER,
NodeType.CONVERSATION_VARIABLE_ASSIGNER,
}:
answer_dependencies[answer_node_id].append(source_node_id)
else:

View File

@ -1,4 +1,4 @@
from .entities import BaseIterationNodeData, BaseIterationState, BaseNodeData
from .node import BaseNode
__all__ = ["BaseIterationNodeData", "BaseIterationState", "BaseNode", "BaseNodeData"]
__all__ = ["BaseNode", "BaseNodeData", "BaseIterationNodeData", "BaseIterationState"]

View File

@ -7,7 +7,6 @@ from pydantic import BaseModel
class BaseNodeData(ABC, BaseModel):
title: str
desc: Optional[str] = None
version: str = "1"
class BaseIterationNodeData(BaseNodeData):

View File

@ -55,9 +55,7 @@ class BaseNode(Generic[GenericNodeData]):
raise ValueError("Node ID is required.")
self.node_id = node_id
node_data = self._node_data_cls.model_validate(config.get("data", {}))
self.node_data = cast(GenericNodeData, node_data)
self.node_data: GenericNodeData = cast(GenericNodeData, self._node_data_cls(**config.get("data", {})))
@abstractmethod
def _run(self) -> NodeRunResult | Generator[Union[NodeEvent, "InNodeEvent"], None, None]:

View File

@ -1,4 +1,4 @@
from .end_node import EndNode
from .entities import EndStreamParam
__all__ = ["EndNode", "EndStreamParam"]
__all__ = ["EndStreamParam", "EndNode"]

View File

@ -14,11 +14,11 @@ class NodeType(StrEnum):
HTTP_REQUEST = "http-request"
TOOL = "tool"
VARIABLE_AGGREGATOR = "variable-aggregator"
LEGACY_VARIABLE_AGGREGATOR = "variable-assigner" # TODO: Merge this into VARIABLE_AGGREGATOR in the database.
VARIABLE_ASSIGNER = "variable-assigner" # TODO: Merge this into VARIABLE_AGGREGATOR in the database.
LOOP = "loop"
ITERATION = "iteration"
ITERATION_START = "iteration-start" # Fake start node for iteration.
PARAMETER_EXTRACTOR = "parameter-extractor"
VARIABLE_ASSIGNER = "assigner"
CONVERSATION_VARIABLE_ASSIGNER = "assigner"
DOCUMENT_EXTRACTOR = "document-extractor"
LIST_OPERATOR = "list-operator"

View File

@ -2,9 +2,9 @@ from .event import ModelInvokeCompletedEvent, RunCompletedEvent, RunRetrieverRes
from .types import NodeEvent
__all__ = [
"ModelInvokeCompletedEvent",
"NodeEvent",
"RunCompletedEvent",
"RunRetrieverResourceEvent",
"RunStreamChunkEvent",
"NodeEvent",
"ModelInvokeCompletedEvent",
]

View File

@ -1,4 +1,4 @@
from .entities import BodyData, HttpRequestNodeAuthorization, HttpRequestNodeBody, HttpRequestNodeData
from .node import HttpRequestNode
__all__ = ["BodyData", "HttpRequestNode", "HttpRequestNodeAuthorization", "HttpRequestNodeBody", "HttpRequestNodeData"]
__all__ = ["HttpRequestNodeData", "HttpRequestNodeAuthorization", "HttpRequestNodeBody", "BodyData", "HttpRequestNode"]

View File

@ -1,9 +1,11 @@
import logging
from collections.abc import Mapping, Sequence
from mimetypes import guess_extension
from os import path
from typing import Any
from configs import dify_config
from core.file import File, FileTransferMethod
from core.file import File, FileTransferMethod, FileType
from core.tools.tool_file_manager import ToolFileManager
from core.workflow.entities.node_entities import NodeRunResult
from core.workflow.entities.variable_entities import VariableSelector
@ -148,6 +150,11 @@ class HttpRequestNode(BaseNode[HttpRequestNodeData]):
content = response.content
if is_file and content_type:
# extract filename from url
filename = path.basename(url)
# extract extension if possible
extension = guess_extension(content_type) or ".bin"
tool_file = ToolFileManager.create_file_by_raw(
user_id=self.user_id,
tenant_id=self.tenant_id,
@ -158,6 +165,7 @@ class HttpRequestNode(BaseNode[HttpRequestNodeData]):
mapping = {
"tool_file_id": tool_file.id,
"type": FileType.IMAGE.value,
"transfer_method": FileTransferMethod.TOOL_FILE.value,
}
file = file_factory.build_from_mapping(

View File

@ -24,7 +24,7 @@ class IfElseNode(BaseNode[IfElseNodeData]):
"""
node_inputs: dict[str, list] = {"conditions": []}
process_data: dict[str, list] = {"condition_results": []}
process_datas: dict[str, list] = {"condition_results": []}
input_conditions = []
final_result = False
@ -40,7 +40,7 @@ class IfElseNode(BaseNode[IfElseNodeData]):
operator=case.logical_operator,
)
process_data["condition_results"].append(
process_datas["condition_results"].append(
{
"group": case.model_dump(),
"results": group_result,
@ -65,7 +65,7 @@ class IfElseNode(BaseNode[IfElseNodeData]):
selected_case_id = "true" if final_result else "false"
process_data["condition_results"].append(
process_datas["condition_results"].append(
{"group": "default", "results": group_result, "final_result": final_result}
)
@ -73,7 +73,7 @@ class IfElseNode(BaseNode[IfElseNodeData]):
except Exception as e:
return NodeRunResult(
status=WorkflowNodeExecutionStatus.FAILED, inputs=node_inputs, process_data=process_data, error=str(e)
status=WorkflowNodeExecutionStatus.FAILED, inputs=node_inputs, process_data=process_datas, error=str(e)
)
outputs = {"result": final_result, "selected_case_id": selected_case_id}
@ -81,7 +81,7 @@ class IfElseNode(BaseNode[IfElseNodeData]):
data = NodeRunResult(
status=WorkflowNodeExecutionStatus.SUCCEEDED,
inputs=node_inputs,
process_data=process_data,
process_data=process_datas,
edge_source_handle=selected_case_id or "false", # Use case ID or 'default'
outputs=outputs,
)

View File

@ -116,7 +116,7 @@ class IterationNode(BaseNode[IterationNodeData]):
variable_pool.add([self.node_id, "item"], iterator_list_value[0])
# init graph engine
from core.workflow.graph_engine.graph_engine import GraphEngine, GraphEngineThreadPool
from core.workflow.graph_engine.graph_engine import GraphEngine
graph_engine = GraphEngine(
tenant_id=self.tenant_id,
@ -162,7 +162,8 @@ class IterationNode(BaseNode[IterationNodeData]):
if self.node_data.is_parallel:
futures: list[Future] = []
q = Queue()
thread_pool = GraphEngineThreadPool(max_workers=self.node_data.parallel_nums, max_submit_count=100)
thread_pool = graph_engine.workflow_thread_pool_mapping[self.thread_pool_id]
thread_pool._max_workers = self.node_data.parallel_nums
for index, item in enumerate(iterator_list_value):
future: Future = thread_pool.submit(
self._run_single_iter_parallel,
@ -235,7 +236,10 @@ class IterationNode(BaseNode[IterationNodeData]):
run_result=NodeRunResult(
status=WorkflowNodeExecutionStatus.SUCCEEDED,
outputs={"output": jsonable_encoder(outputs)},
metadata={NodeRunMetadataKey.ITERATION_DURATION_MAP: iter_run_map},
metadata={
NodeRunMetadataKey.ITERATION_DURATION_MAP: iter_run_map,
"total_tokens": graph_engine.graph_runtime_state.total_tokens,
},
)
)
except IterationNodeError as e:
@ -258,6 +262,7 @@ class IterationNode(BaseNode[IterationNodeData]):
run_result=NodeRunResult(
status=WorkflowNodeExecutionStatus.FAILED,
error=str(e),
metadata={"total_tokens": graph_engine.graph_runtime_state.total_tokens},
)
)
finally:
@ -297,13 +302,12 @@ class IterationNode(BaseNode[IterationNodeData]):
# variable selector to variable mapping
try:
# Get node class
from core.workflow.nodes.node_mapping import NODE_TYPE_CLASSES_MAPPING
from core.workflow.nodes.node_mapping import node_type_classes_mapping
node_type = NodeType(sub_node_config.get("data", {}).get("type"))
if node_type not in NODE_TYPE_CLASSES_MAPPING:
node_cls = node_type_classes_mapping.get(node_type)
if not node_cls:
continue
node_version = sub_node_config.get("data", {}).get("version", "1")
node_cls = NODE_TYPE_CLASSES_MAPPING[node_type][node_version]
sub_node_variable_mapping = node_cls.extract_variable_selector_to_variable_mapping(
graph_config=graph_config, config=sub_node_config

View File

@ -815,7 +815,7 @@ class LLMNode(BaseNode[LLMNodeData]):
"completion_model": {
"conversation_histories_role": {"user_prefix": "Human", "assistant_prefix": "Assistant"},
"prompt": {
"text": "Here are the chat histories between human and assistant, inside "
"text": "Here is the chat histories between human and assistant, inside "
"<histories></histories> XML tags.\n\n<histories>\n{{"
"#histories#}}\n</histories>\n\n\nHuman: {{#sys.query#}}\n\nAssistant:",
"edition_type": "basic",

View File

@ -1,5 +1,3 @@
from collections.abc import Mapping
from core.workflow.nodes.answer import AnswerNode
from core.workflow.nodes.base import BaseNode
from core.workflow.nodes.code import CodeNode
@ -18,87 +16,26 @@ from core.workflow.nodes.start import StartNode
from core.workflow.nodes.template_transform import TemplateTransformNode
from core.workflow.nodes.tool import ToolNode
from core.workflow.nodes.variable_aggregator import VariableAggregatorNode
from core.workflow.nodes.variable_assigner.v1 import VariableAssignerNode as VariableAssignerNodeV1
from core.workflow.nodes.variable_assigner.v2 import VariableAssignerNode as VariableAssignerNodeV2
from core.workflow.nodes.variable_assigner import VariableAssignerNode
LATEST_VERSION = "latest"
NODE_TYPE_CLASSES_MAPPING: Mapping[NodeType, Mapping[str, type[BaseNode]]] = {
NodeType.START: {
LATEST_VERSION: StartNode,
"1": StartNode,
},
NodeType.END: {
LATEST_VERSION: EndNode,
"1": EndNode,
},
NodeType.ANSWER: {
LATEST_VERSION: AnswerNode,
"1": AnswerNode,
},
NodeType.LLM: {
LATEST_VERSION: LLMNode,
"1": LLMNode,
},
NodeType.KNOWLEDGE_RETRIEVAL: {
LATEST_VERSION: KnowledgeRetrievalNode,
"1": KnowledgeRetrievalNode,
},
NodeType.IF_ELSE: {
LATEST_VERSION: IfElseNode,
"1": IfElseNode,
},
NodeType.CODE: {
LATEST_VERSION: CodeNode,
"1": CodeNode,
},
NodeType.TEMPLATE_TRANSFORM: {
LATEST_VERSION: TemplateTransformNode,
"1": TemplateTransformNode,
},
NodeType.QUESTION_CLASSIFIER: {
LATEST_VERSION: QuestionClassifierNode,
"1": QuestionClassifierNode,
},
NodeType.HTTP_REQUEST: {
LATEST_VERSION: HttpRequestNode,
"1": HttpRequestNode,
},
NodeType.TOOL: {
LATEST_VERSION: ToolNode,
"1": ToolNode,
},
NodeType.VARIABLE_AGGREGATOR: {
LATEST_VERSION: VariableAggregatorNode,
"1": VariableAggregatorNode,
},
NodeType.LEGACY_VARIABLE_AGGREGATOR: {
LATEST_VERSION: VariableAggregatorNode,
"1": VariableAggregatorNode,
}, # original name of VARIABLE_AGGREGATOR
NodeType.ITERATION: {
LATEST_VERSION: IterationNode,
"1": IterationNode,
},
NodeType.ITERATION_START: {
LATEST_VERSION: IterationStartNode,
"1": IterationStartNode,
},
NodeType.PARAMETER_EXTRACTOR: {
LATEST_VERSION: ParameterExtractorNode,
"1": ParameterExtractorNode,
},
NodeType.VARIABLE_ASSIGNER: {
LATEST_VERSION: VariableAssignerNodeV2,
"1": VariableAssignerNodeV1,
"2": VariableAssignerNodeV2,
},
NodeType.DOCUMENT_EXTRACTOR: {
LATEST_VERSION: DocumentExtractorNode,
"1": DocumentExtractorNode,
},
NodeType.LIST_OPERATOR: {
LATEST_VERSION: ListOperatorNode,
"1": ListOperatorNode,
},
node_type_classes_mapping: dict[NodeType, type[BaseNode]] = {
NodeType.START: StartNode,
NodeType.END: EndNode,
NodeType.ANSWER: AnswerNode,
NodeType.LLM: LLMNode,
NodeType.KNOWLEDGE_RETRIEVAL: KnowledgeRetrievalNode,
NodeType.IF_ELSE: IfElseNode,
NodeType.CODE: CodeNode,
NodeType.TEMPLATE_TRANSFORM: TemplateTransformNode,
NodeType.QUESTION_CLASSIFIER: QuestionClassifierNode,
NodeType.HTTP_REQUEST: HttpRequestNode,
NodeType.TOOL: ToolNode,
NodeType.VARIABLE_AGGREGATOR: VariableAggregatorNode,
NodeType.VARIABLE_ASSIGNER: VariableAggregatorNode, # original name of VARIABLE_AGGREGATOR
NodeType.ITERATION: IterationNode,
NodeType.ITERATION_START: IterationStartNode,
NodeType.PARAMETER_EXTRACTOR: ParameterExtractorNode,
NodeType.CONVERSATION_VARIABLE_ASSIGNER: VariableAssignerNode,
NodeType.DOCUMENT_EXTRACTOR: DocumentExtractorNode,
NodeType.LIST_OPERATOR: ListOperatorNode,
}
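The two registry shapes in this hunk differ in lookup depth: the versioned form (removed here) resolves by node type and then by version, while the flat form (restored here) resolves by type alone. A standalone sketch:

```python
from collections.abc import Mapping

class StartNode: ...

LATEST_VERSION = "latest"

# Versioned shape: mapping[node_type][node_version]
versioned: Mapping[str, Mapping[str, type]] = {
    "start": {LATEST_VERSION: StartNode, "1": StartNode},
}

# Flat shape: mapping[node_type]
flat: Mapping[str, type] = {"start": StartNode}

assert versioned["start"]["1"] is flat["start"]
```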

View File

@ -98,7 +98,7 @@ Step 3: Structure the extracted parameters to JSON object as specified in <struc
Step 4: Ensure that the JSON object is properly formatted and valid. The output should not contain any XML tags. Only the JSON object should be outputted.
### Memory
Here are the chat histories between human and assistant, inside <histories></histories> XML tags.
Here is the chat histories between human and assistant, inside <histories></histories> XML tags.
<histories>
{histories}
</histories>
@ -125,7 +125,7 @@ CHAT_GENERATE_JSON_PROMPT = """You should always follow the instructions and out
The structure of the JSON object you can found in the instructions.
### Memory
Here are the chat histories between human and assistant, inside <histories></histories> XML tags.
Here is the chat histories between human and assistant, inside <histories></histories> XML tags.
<histories>
{histories}
</histories>

View File

@ -1,4 +1,4 @@
from .entities import QuestionClassifierNodeData
from .question_classifier_node import QuestionClassifierNode
__all__ = ["QuestionClassifierNode", "QuestionClassifierNodeData"]
__all__ = ["QuestionClassifierNodeData", "QuestionClassifierNode"]

View File

@ -8,7 +8,7 @@ QUESTION_CLASSIFIER_SYSTEM_PROMPT = """
### Constraint
DO NOT include anything other than the JSON array in your response.
### Memory
Here are the chat histories between human and assistant, inside <histories></histories> XML tags.
Here is the chat histories between human and assistant, inside <histories></histories> XML tags.
<histories>
{histories}
</histories>
@ -66,7 +66,7 @@ User:{{"input_text": ["bad service, slow to bring the food"], "categories": [{{"
Assistant:{{"keywords": ["bad service", "slow", "food", "tip", "terrible", "waitresses"],"category_id": "f6ff5bc3-aca0-4e4a-8627-e760d0aca78f","category_name": "Experience"}}
</example>
### Memory
Here are the chat histories between human and assistant, inside <histories></histories> XML tags.
Here is the chat histories between human and assistant, inside <histories></histories> XML tags.
<histories>
{histories}
</histories>

View File

@ -0,0 +1,8 @@
from .node import VariableAssignerNode
from .node_data import VariableAssignerData, WriteMode
__all__ = [
"VariableAssignerNode",
"VariableAssignerData",
"WriteMode",
]

View File

@ -1,4 +0,0 @@
class VariableOperatorNodeError(Exception):
"""Base error type, don't use directly."""
pass

View File

@ -1,19 +0,0 @@
from sqlalchemy import select
from sqlalchemy.orm import Session
from core.variables import Variable
from core.workflow.nodes.variable_assigner.common.exc import VariableOperatorNodeError
from extensions.ext_database import db
from models import ConversationVariable
def update_conversation_variable(conversation_id: str, variable: Variable):
stmt = select(ConversationVariable).where(
ConversationVariable.id == variable.id, ConversationVariable.conversation_id == conversation_id
)
with Session(db.engine) as session:
row = session.scalar(stmt)
if not row:
raise VariableOperatorNodeError("conversation variable not found in the database")
row.data = variable.model_dump_json()
session.commit()

View File

@ -0,0 +1,2 @@
class VariableAssignerNodeError(Exception):
pass

View File

@ -1,36 +1,40 @@
from sqlalchemy import select
from sqlalchemy.orm import Session
from core.variables import SegmentType, Variable
from core.workflow.entities.node_entities import NodeRunResult
from core.workflow.nodes.base import BaseNode, BaseNodeData
from core.workflow.nodes.enums import NodeType
from core.workflow.nodes.variable_assigner.common import helpers as common_helpers
from core.workflow.nodes.variable_assigner.common.exc import VariableOperatorNodeError
from extensions.ext_database import db
from factories import variable_factory
from models import ConversationVariable
from models.workflow import WorkflowNodeExecutionStatus
from .exc import VariableAssignerNodeError
from .node_data import VariableAssignerData, WriteMode
class VariableAssignerNode(BaseNode[VariableAssignerData]):
_node_data_cls: type[BaseNodeData] = VariableAssignerData
_node_type = NodeType.VARIABLE_ASSIGNER
_node_type: NodeType = NodeType.CONVERSATION_VARIABLE_ASSIGNER
def _run(self) -> NodeRunResult:
# Should be String, Number, Object, ArrayString, ArrayNumber, ArrayObject
original_variable = self.graph_runtime_state.variable_pool.get(self.node_data.assigned_variable_selector)
if not isinstance(original_variable, Variable):
raise VariableOperatorNodeError("assigned variable not found")
raise VariableAssignerNodeError("assigned variable not found")
match self.node_data.write_mode:
case WriteMode.OVER_WRITE:
income_value = self.graph_runtime_state.variable_pool.get(self.node_data.input_variable_selector)
if not income_value:
raise VariableOperatorNodeError("input value not found")
raise VariableAssignerNodeError("input value not found")
updated_variable = original_variable.model_copy(update={"value": income_value.value})
case WriteMode.APPEND:
income_value = self.graph_runtime_state.variable_pool.get(self.node_data.input_variable_selector)
if not income_value:
raise VariableOperatorNodeError("input value not found")
raise VariableAssignerNodeError("input value not found")
updated_value = original_variable.value + [income_value.value]
updated_variable = original_variable.model_copy(update={"value": updated_value})
@ -39,7 +43,7 @@ class VariableAssignerNode(BaseNode[VariableAssignerData]):
updated_variable = original_variable.model_copy(update={"value": income_value.to_object()})
case _:
raise VariableOperatorNodeError(f"unsupported write mode: {self.node_data.write_mode}")
raise VariableAssignerNodeError(f"unsupported write mode: {self.node_data.write_mode}")
# Over write the variable.
self.graph_runtime_state.variable_pool.add(self.node_data.assigned_variable_selector, updated_variable)
@ -48,8 +52,8 @@ class VariableAssignerNode(BaseNode[VariableAssignerData]):
# Update conversation variable.
conversation_id = self.graph_runtime_state.variable_pool.get(["sys", "conversation_id"])
if not conversation_id:
raise VariableOperatorNodeError("conversation_id not found")
common_helpers.update_conversation_variable(conversation_id=conversation_id.text, variable=updated_variable)
raise VariableAssignerNodeError("conversation_id not found")
update_conversation_variable(conversation_id=conversation_id.text, variable=updated_variable)
return NodeRunResult(
status=WorkflowNodeExecutionStatus.SUCCEEDED,
@ -59,6 +63,18 @@ class VariableAssignerNode(BaseNode[VariableAssignerData]):
)
def update_conversation_variable(conversation_id: str, variable: Variable):
stmt = select(ConversationVariable).where(
ConversationVariable.id == variable.id, ConversationVariable.conversation_id == conversation_id
)
with Session(db.engine) as session:
row = session.scalar(stmt)
if not row:
raise VariableAssignerNodeError("conversation variable not found in the database")
row.data = variable.model_dump_json()
session.commit()
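For context, a minimal usage sketch of this restored helper; the variable and conversation id below are placeholders, not values from this change:

# Hypothetical usage: overwrite a conversation variable's value and persist it.
# Assumes `original_variable` came from the variable pool and a matching
# ConversationVariable row already exists for this conversation.
updated = original_variable.model_copy(update={"value": "new value"})
update_conversation_variable(conversation_id="example-conversation-id", variable=updated)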
def get_zero_value(t: SegmentType):
match t:
case SegmentType.ARRAY_OBJECT | SegmentType.ARRAY_STRING | SegmentType.ARRAY_NUMBER:
@ -70,4 +86,4 @@ def get_zero_value(t: SegmentType):
case SegmentType.NUMBER:
return variable_factory.build_segment(0)
case _:
raise VariableOperatorNodeError(f"unsupported variable type: {t}")
raise VariableAssignerNodeError(f"unsupported variable type: {t}")

View File

@ -1,5 +1,6 @@
from collections.abc import Sequence
from enum import StrEnum
from typing import Optional
from core.workflow.nodes.base import BaseNodeData
@ -11,6 +12,8 @@ class WriteMode(StrEnum):
class VariableAssignerData(BaseNodeData):
title: str = "Variable Assigner"
desc: Optional[str] = "Assign a value to a variable"
assigned_variable_selector: Sequence[str]
write_mode: WriteMode
input_variable_selector: Sequence[str]

View File

@ -1,3 +0,0 @@
from .node import VariableAssignerNode
__all__ = ["VariableAssignerNode"]

View File

@ -1,3 +0,0 @@
from .node import VariableAssignerNode
__all__ = ["VariableAssignerNode"]

View File

@ -1,11 +0,0 @@
from core.variables import SegmentType
EMPTY_VALUE_MAPPING = {
SegmentType.STRING: "",
SegmentType.NUMBER: 0,
SegmentType.OBJECT: {},
SegmentType.ARRAY_ANY: [],
SegmentType.ARRAY_STRING: [],
SegmentType.ARRAY_NUMBER: [],
SegmentType.ARRAY_OBJECT: [],
}
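Before its removal here, this mapping backed the v2 node's CLEAR operation; a quick illustration of the intent:

# Illustration: CLEAR resets a variable to the empty value for its type.
assert EMPTY_VALUE_MAPPING[SegmentType.STRING] == ""
assert EMPTY_VALUE_MAPPING[SegmentType.NUMBER] == 0
assert EMPTY_VALUE_MAPPING[SegmentType.ARRAY_OBJECT] == []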

View File

@ -1,20 +0,0 @@
from collections.abc import Sequence
from typing import Any
from pydantic import BaseModel
from core.workflow.nodes.base import BaseNodeData
from .enums import InputType, Operation
class VariableOperationItem(BaseModel):
variable_selector: Sequence[str]
input_type: InputType
operation: Operation
value: Any | None = None
class VariableAssignerNodeData(BaseNodeData):
version: str = "2"
items: Sequence[VariableOperationItem]

View File

@ -1,18 +0,0 @@
from enum import StrEnum
class Operation(StrEnum):
OVER_WRITE = "over-write"
CLEAR = "clear"
APPEND = "append"
EXTEND = "extend"
SET = "set"
ADD = "+="
SUBTRACT = "-="
MULTIPLY = "*="
DIVIDE = "/="
class InputType(StrEnum):
VARIABLE = "variable"
CONSTANT = "constant"

View File

@ -1,31 +0,0 @@
from collections.abc import Sequence
from typing import Any
from core.workflow.nodes.variable_assigner.common.exc import VariableOperatorNodeError
from .enums import InputType, Operation
class OperationNotSupportedError(VariableOperatorNodeError):
def __init__(self, *, operation: Operation, variable_type: str):
super().__init__(f"Operation {operation} is not supported for type {variable_type}")
class InputTypeNotSupportedError(VariableOperatorNodeError):
def __init__(self, *, input_type: InputType, operation: Operation):
super().__init__(f"Input type {input_type} is not supported for operation {operation}")
class VariableNotFoundError(VariableOperatorNodeError):
def __init__(self, *, variable_selector: Sequence[str]):
super().__init__(f"Variable {variable_selector} not found")
class InvalidInputValueError(VariableOperatorNodeError):
def __init__(self, *, value: Any):
super().__init__(f"Invalid input value {value}")
class ConversationIDNotFoundError(VariableOperatorNodeError):
def __init__(self):
super().__init__("conversation_id not found")

View File

@ -1,91 +0,0 @@
from typing import Any
from core.variables import SegmentType
from .enums import Operation
def is_operation_supported(*, variable_type: SegmentType, operation: Operation):
match operation:
case Operation.OVER_WRITE | Operation.CLEAR:
return True
case Operation.SET:
return variable_type in {SegmentType.OBJECT, SegmentType.STRING, SegmentType.NUMBER}
case Operation.ADD | Operation.SUBTRACT | Operation.MULTIPLY | Operation.DIVIDE:
# Only number variables can be added, subtracted, multiplied or divided
return variable_type == SegmentType.NUMBER
case Operation.APPEND | Operation.EXTEND:
# Only array variables can be appended to or extended
return variable_type in {
SegmentType.ARRAY_ANY,
SegmentType.ARRAY_OBJECT,
SegmentType.ARRAY_STRING,
SegmentType.ARRAY_NUMBER,
SegmentType.ARRAY_FILE,
}
case _:
return False
def is_variable_input_supported(*, operation: Operation):
if operation in {Operation.SET, Operation.ADD, Operation.SUBTRACT, Operation.MULTIPLY, Operation.DIVIDE}:
return False
return True
def is_constant_input_supported(*, variable_type: SegmentType, operation: Operation):
match variable_type:
case SegmentType.STRING | SegmentType.OBJECT:
return operation in {Operation.OVER_WRITE, Operation.SET}
case SegmentType.NUMBER:
return operation in {
Operation.OVER_WRITE,
Operation.SET,
Operation.ADD,
Operation.SUBTRACT,
Operation.MULTIPLY,
Operation.DIVIDE,
}
case _:
return False
def is_input_value_valid(*, variable_type: SegmentType, operation: Operation, value: Any):
if operation == Operation.CLEAR:
return True
match variable_type:
case SegmentType.STRING:
return isinstance(value, str)
case SegmentType.NUMBER:
if not isinstance(value, int | float):
return False
if operation == Operation.DIVIDE and value == 0:
return False
return True
case SegmentType.OBJECT:
return isinstance(value, dict)
# Array & Append
case SegmentType.ARRAY_ANY if operation == Operation.APPEND:
return isinstance(value, str | float | int | dict)
case SegmentType.ARRAY_STRING if operation == Operation.APPEND:
return isinstance(value, str)
case SegmentType.ARRAY_NUMBER if operation == Operation.APPEND:
return isinstance(value, int | float)
case SegmentType.ARRAY_OBJECT if operation == Operation.APPEND:
return isinstance(value, dict)
# Array & Extend / Overwrite
case SegmentType.ARRAY_ANY if operation in {Operation.EXTEND, Operation.OVER_WRITE}:
return isinstance(value, list) and all(isinstance(item, str | float | int | dict) for item in value)
case SegmentType.ARRAY_STRING if operation in {Operation.EXTEND, Operation.OVER_WRITE}:
return isinstance(value, list) and all(isinstance(item, str) for item in value)
case SegmentType.ARRAY_NUMBER if operation in {Operation.EXTEND, Operation.OVER_WRITE}:
return isinstance(value, list) and all(isinstance(item, int | float) for item in value)
case SegmentType.ARRAY_OBJECT if operation in {Operation.EXTEND, Operation.OVER_WRITE}:
return isinstance(value, list) and all(isinstance(item, dict) for item in value)
case _:
return False
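These guards compose into a pre-flight check before an operation runs; a small illustrative example (the operation and values are made up):

# Illustrative validation of a single operation item.
op = Operation.APPEND
vt = SegmentType.ARRAY_STRING

assert is_operation_supported(variable_type=vt, operation=op)
assert is_input_value_valid(variable_type=vt, operation=op, value="hello")
assert not is_input_value_valid(variable_type=vt, operation=op, value=123)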

View File

@ -1,159 +0,0 @@
import json
from typing import Any
from core.variables import SegmentType, Variable
from core.workflow.constants import CONVERSATION_VARIABLE_NODE_ID
from core.workflow.entities.node_entities import NodeRunResult
from core.workflow.nodes.base import BaseNode
from core.workflow.nodes.enums import NodeType
from core.workflow.nodes.variable_assigner.common import helpers as common_helpers
from core.workflow.nodes.variable_assigner.common.exc import VariableOperatorNodeError
from models.workflow import WorkflowNodeExecutionStatus
from . import helpers
from .constants import EMPTY_VALUE_MAPPING
from .entities import VariableAssignerNodeData
from .enums import InputType, Operation
from .exc import (
ConversationIDNotFoundError,
InputTypeNotSupportedError,
InvalidInputValueError,
OperationNotSupportedError,
VariableNotFoundError,
)
class VariableAssignerNode(BaseNode[VariableAssignerNodeData]):
_node_data_cls = VariableAssignerNodeData
_node_type = NodeType.VARIABLE_ASSIGNER
def _run(self) -> NodeRunResult:
inputs = self.node_data.model_dump()
process_data = {}
# NOTE: This node has no outputs
updated_variables: list[Variable] = []
try:
for item in self.node_data.items:
variable = self.graph_runtime_state.variable_pool.get(item.variable_selector)
# ==================== Validation Part
# Check if variable exists
if not isinstance(variable, Variable):
raise VariableNotFoundError(variable_selector=item.variable_selector)
# Check if operation is supported
if not helpers.is_operation_supported(variable_type=variable.value_type, operation=item.operation):
raise OperationNotSupportedError(operation=item.operation, variable_type=variable.value_type)
# Check if variable input is supported
if item.input_type == InputType.VARIABLE and not helpers.is_variable_input_supported(
operation=item.operation
):
raise InputTypeNotSupportedError(input_type=InputType.VARIABLE, operation=item.operation)
# Check if constant input is supported
if item.input_type == InputType.CONSTANT and not helpers.is_constant_input_supported(
variable_type=variable.value_type, operation=item.operation
):
raise InputTypeNotSupportedError(input_type=InputType.CONSTANT, operation=item.operation)
# Get value from variable pool
if (
item.input_type == InputType.VARIABLE
and item.operation != Operation.CLEAR
and item.value is not None
):
value = self.graph_runtime_state.variable_pool.get(item.value)
if value is None:
raise VariableNotFoundError(variable_selector=item.value)
# Skip if value is NoneSegment
if value.value_type == SegmentType.NONE:
continue
item.value = value.value
# When setting a string / bytes / bytearray value on an object variable, try to convert the string to an object.
if (
item.operation == Operation.SET
and variable.value_type == SegmentType.OBJECT
and isinstance(item.value, str | bytes | bytearray)
):
try:
item.value = json.loads(item.value)
except json.JSONDecodeError:
raise InvalidInputValueError(value=item.value)
# Check if input value is valid
if not helpers.is_input_value_valid(
variable_type=variable.value_type, operation=item.operation, value=item.value
):
raise InvalidInputValueError(value=item.value)
# ==================== Execution Part
updated_value = self._handle_item(
variable=variable,
operation=item.operation,
value=item.value,
)
variable = variable.model_copy(update={"value": updated_value})
updated_variables.append(variable)
except VariableOperatorNodeError as e:
return NodeRunResult(
status=WorkflowNodeExecutionStatus.FAILED,
inputs=inputs,
process_data=process_data,
error=str(e),
)
# Update variables
for variable in updated_variables:
self.graph_runtime_state.variable_pool.add(variable.selector, variable)
process_data[variable.name] = variable.value
if variable.selector[0] == CONVERSATION_VARIABLE_NODE_ID:
conversation_id = self.graph_runtime_state.variable_pool.get(["sys", "conversation_id"])
if not conversation_id:
raise ConversationIDNotFoundError
else:
conversation_id = conversation_id.value
common_helpers.update_conversation_variable(
conversation_id=conversation_id,
variable=variable,
)
return NodeRunResult(
status=WorkflowNodeExecutionStatus.SUCCEEDED,
inputs=inputs,
process_data=process_data,
)
def _handle_item(
self,
*,
variable: Variable,
operation: Operation,
value: Any,
):
match operation:
case Operation.OVER_WRITE:
return value
case Operation.CLEAR:
return EMPTY_VALUE_MAPPING[variable.value_type]
case Operation.APPEND:
return variable.value + [value]
case Operation.EXTEND:
return variable.value + value
case Operation.SET:
return value
case Operation.ADD:
return variable.value + value
case Operation.SUBTRACT:
return variable.value - value
case Operation.MULTIPLY:
return variable.value * value
case Operation.DIVIDE:
return variable.value / value
case _:
raise OperationNotSupportedError(operation=operation, variable_type=variable.value_type)
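For reference, a sketch of the node data this v2 node consumed, built from the entities above; the selectors and values are placeholders:

# Hypothetical node data: add 1 to a numeric conversation variable, then
# append a value (resolved from another selector) to an array variable.
data = VariableAssignerNodeData(
    items=[
        VariableOperationItem(
            variable_selector=["conversation", "counter"],
            input_type=InputType.CONSTANT,
            operation=Operation.ADD,
            value=1,
        ),
        VariableOperationItem(
            variable_selector=["conversation", "tags"],
            input_type=InputType.VARIABLE,
            operation=Operation.APPEND,
            value=["node_id", "new_tag"],  # selector pointing at the value to append
        ),
    ]
)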

View File

@ -2,7 +2,7 @@ import logging
import time
import uuid
from collections.abc import Generator, Mapping, Sequence
from typing import Any, Optional
from typing import Any, Optional, cast
from configs import dify_config
from core.app.apps.base_app_queue_manager import GenerateTaskStoppedError
@ -19,7 +19,7 @@ from core.workflow.graph_engine.graph_engine import GraphEngine
from core.workflow.nodes import NodeType
from core.workflow.nodes.base import BaseNode
from core.workflow.nodes.event import NodeEvent
from core.workflow.nodes.node_mapping import NODE_TYPE_CLASSES_MAPPING
from core.workflow.nodes.node_mapping import node_type_classes_mapping
from factories import file_factory
from models.enums import UserFrom
from models.workflow import (
@ -145,8 +145,11 @@ class WorkflowEntry:
# Get node class
node_type = NodeType(node_config.get("data", {}).get("type"))
node_version = node_config.get("data", {}).get("version", "1")
node_cls = NODE_TYPE_CLASSES_MAPPING[node_type][node_version]
node_cls = node_type_classes_mapping.get(node_type)
node_cls = cast(type[BaseNode], node_cls)
if not node_cls:
raise ValueError(f"Node class not found for node type {node_type}")
# init variable pool
variable_pool = VariablePool(environment_variables=workflow.environment_variables)

View File

@ -1,5 +1,3 @@
from typing import Any, Union
import redis
from redis.cluster import ClusterNode, RedisCluster
from redis.connection import Connection, SSLConnection
@ -48,11 +46,11 @@ redis_client = RedisClientWrapper()
def init_app(app: DifyApp):
global redis_client
connection_class: type[Union[Connection, SSLConnection]] = Connection
connection_class = Connection
if dify_config.REDIS_USE_SSL:
connection_class = SSLConnection
redis_params: dict[str, Any] = {
redis_params = {
"username": dify_config.REDIS_USERNAME,
"password": dify_config.REDIS_PASSWORD,
"db": dify_config.REDIS_DB,
@ -62,7 +60,6 @@ def init_app(app: DifyApp):
}
if dify_config.REDIS_USE_SENTINEL:
assert dify_config.REDIS_SENTINELS is not None, "REDIS_SENTINELS must be set when REDIS_USE_SENTINEL is True"
sentinel_hosts = [
(node.split(":")[0], int(node.split(":")[1])) for node in dify_config.REDIS_SENTINELS.split(",")
]
@ -77,13 +74,11 @@ def init_app(app: DifyApp):
master = sentinel.master_for(dify_config.REDIS_SENTINEL_SERVICE_NAME, **redis_params)
redis_client.initialize(master)
elif dify_config.REDIS_USE_CLUSTERS:
assert dify_config.REDIS_CLUSTERS is not None, "REDIS_CLUSTERS must be set when REDIS_USE_CLUSTERS is True"
nodes = [
ClusterNode(host=node.split(":")[0], port=int(node.split(":")[1]))
ClusterNode(host=node.split(":")[0], port=int(node.split(":")[1]))
for node in dify_config.REDIS_CLUSTERS.split(",")
]
# FIXME: mypy error here, try to figure out how to fix it
redis_client.initialize(RedisCluster(startup_nodes=nodes, password=dify_config.REDIS_CLUSTERS_PASSWORD)) # type: ignore
redis_client.initialize(RedisCluster(startup_nodes=nodes, password=dify_config.REDIS_CLUSTERS_PASSWORD))
else:
redis_params.update(
{

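Both the sentinel and cluster branches parse comma-separated host:port strings the same way; a quick sketch of that parsing with placeholder addresses:

# Sketch: parse "host:port,host:port" into (host, port) tuples, mirroring
# the sentinel/cluster branches above.
raw = "10.0.0.1:26379,10.0.0.2:26379"
hosts = [(node.split(":")[0], int(node.split(":")[1])) for node in raw.split(",")]
assert hosts == [("10.0.0.1", 26379), ("10.0.0.2", 26379)]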
View File

@ -36,7 +36,6 @@ from core.variables.variables import (
StringVariable,
Variable,
)
from core.workflow.constants import CONVERSATION_VARIABLE_NODE_ID, ENVIRONMENT_VARIABLE_NODE_ID
class InvalidSelectorError(ValueError):
@ -63,25 +62,11 @@ SEGMENT_TO_VARIABLE_MAP = {
}
def build_conversation_variable_from_mapping(mapping: Mapping[str, Any], /) -> Variable:
if not mapping.get("name"):
raise VariableError("missing name")
return _build_variable_from_mapping(mapping=mapping, selector=[CONVERSATION_VARIABLE_NODE_ID, mapping["name"]])
def build_environment_variable_from_mapping(mapping: Mapping[str, Any], /) -> Variable:
if not mapping.get("name"):
raise VariableError("missing name")
return _build_variable_from_mapping(mapping=mapping, selector=[ENVIRONMENT_VARIABLE_NODE_ID, mapping["name"]])
def _build_variable_from_mapping(*, mapping: Mapping[str, Any], selector: Sequence[str]) -> Variable:
"""
This factory function is used to create environment variables or conversation variables;
it does not support the File type.
"""
def build_variable_from_mapping(mapping: Mapping[str, Any], /) -> Variable:
if (value_type := mapping.get("value_type")) is None:
raise VariableError("missing value type")
if not mapping.get("name"):
raise VariableError("missing name")
if (value := mapping.get("value")) is None:
raise VariableError("missing value")
match value_type:
@ -107,8 +92,6 @@ def _build_variable_from_mapping(*, mapping: Mapping[str, Any], selector: Sequen
raise VariableError(f"not supported value type {value_type}")
if result.size > dify_config.MAX_VARIABLE_SIZE:
raise VariableError(f"variable size {result.size} exceeds limit {dify_config.MAX_VARIABLE_SIZE}")
if not result.selector:
result = result.model_copy(update={"selector": selector})
return result
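The size guard above rejects oversized values at build time; a hedged sketch, assuming `size` tracks the length of the encoded value:

# Sketch: a value beyond MAX_VARIABLE_SIZE raises VariableError at build time.
too_big = {
    "value_type": "string",
    "name": "too_big",
    "value": "a" * (dify_config.MAX_VARIABLE_SIZE + 1),
}
try:
    build_variable_from_mapping(too_big)
except VariableError:
    pass  # expected: variable size exceeds the configured limit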

View File

@ -10,10 +10,10 @@ from collections.abc import Generator, Mapping
from datetime import datetime
from hashlib import sha256
from typing import Any, Optional, Union
from zoneinfo import available_timezones
from flask import Response, stream_with_context
from flask_restful import fields
from zoneinfo import available_timezones
from configs import dify_config
from core.app.features.rate_limiting.rate_limit import RateLimitGenerator

View File

@ -24,30 +24,30 @@ from .workflow import (
)
__all__ = [
"Account",
"AccountIntegrate",
"ApiToken",
"App",
"AppMode",
"Conversation",
"ConversationVariable",
"DataSourceOauthBinding",
"Document",
"Dataset",
"DatasetProcessRule",
"Document",
"DocumentSegment",
"EndUser",
"InstalledApp",
"InvitationCode",
"Message",
"MessageAnnotation",
"MessageFile",
"RecommendedApp",
"Site",
"Tenant",
"ToolFile",
"UploadFile",
"DataSourceOauthBinding",
"AppMode",
"Workflow",
"App",
"Message",
"EndUser",
"MessageFile",
"UploadFile",
"Account",
"WorkflowAppLog",
"WorkflowRun",
"Site",
"InstalledApp",
"RecommendedApp",
"ApiToken",
"AccountIntegrate",
"InvitationCode",
"Tenant",
"Conversation",
"MessageAnnotation",
"ToolFile",
]

View File

@ -238,9 +238,7 @@ class Workflow(db.Model):
tenant_id = contexts.tenant_id.get()
environment_variables_dict: dict[str, Any] = json.loads(self._environment_variables)
results = [
variable_factory.build_environment_variable_from_mapping(v) for v in environment_variables_dict.values()
]
results = [variable_factory.build_variable_from_mapping(v) for v in environment_variables_dict.values()]
# decrypt secret variables value
decrypt_func = (
@ -305,7 +303,7 @@ class Workflow(db.Model):
self._conversation_variables = "{}"
variables_dict: dict[str, Any] = json.loads(self._conversation_variables)
results = [variable_factory.build_conversation_variable_from_mapping(v) for v in variables_dict.values()]
results = [variable_factory.build_variable_from_mapping(v) for v in variables_dict.values()]
return results
@conversation_variables.setter
@ -795,4 +793,4 @@ class ConversationVariable(db.Model):
def to_variable(self) -> Variable:
mapping = json.loads(self.data)
return variable_factory.build_conversation_variable_from_mapping(mapping)
return variable_factory.build_variable_from_mapping(mapping)

api/poetry.lock (generated)

File diff suppressed because it is too large.

View File

@ -20,7 +20,7 @@ azure-ai-inference = "~1.0.0b3"
azure-ai-ml = "~1.20.0"
azure-identity = "1.16.1"
beautifulsoup4 = "4.12.2"
boto3 = "1.35.74"
boto3 = "1.35.17"
bs4 = "~0.0.1"
cachetools = "~5.3.0"
celery = "~5.4.0"

View File

@ -22,7 +22,7 @@ logger = logging.getLogger(__name__)
IMPORT_INFO_REDIS_KEY_PREFIX = "app_import_info:"
IMPORT_INFO_REDIS_EXPIRY = 180 # 3 minutes
CURRENT_DSL_VERSION = "0.1.4"
CURRENT_DSL_VERSION = "0.1.3"
class ImportMode(StrEnum):
@ -387,11 +387,11 @@ class AppDslService:
environment_variables_list = workflow_data.get("environment_variables", [])
environment_variables = [
variable_factory.build_environment_variable_from_mapping(obj) for obj in environment_variables_list
variable_factory.build_variable_from_mapping(obj) for obj in environment_variables_list
]
conversation_variables_list = workflow_data.get("conversation_variables", [])
conversation_variables = [
variable_factory.build_conversation_variable_from_mapping(obj) for obj in conversation_variables_list
variable_factory.build_variable_from_mapping(obj) for obj in conversation_variables_list
]
workflow_service = WorkflowService()

View File

@ -14,16 +14,16 @@ from . import (
)
__all__ = [
"account",
"app",
"app_model_config",
"audio",
"base",
"completion",
"conversation",
"dataset",
"document",
"file",
"index",
"message",
"index",
"app_model_config",
"account",
"document",
"dataset",
"app",
"completion",
"audio",
"file",
]

View File

@ -12,7 +12,7 @@ from core.workflow.entities.node_entities import NodeRunResult
from core.workflow.errors import WorkflowNodeRunFailedError
from core.workflow.nodes import NodeType
from core.workflow.nodes.event import RunCompletedEvent
from core.workflow.nodes.node_mapping import LATEST_VERSION, NODE_TYPE_CLASSES_MAPPING
from core.workflow.nodes.node_mapping import node_type_classes_mapping
from core.workflow.workflow_entry import WorkflowEntry
from events.app_event import app_draft_workflow_was_synced, app_published_workflow_was_updated
from extensions.ext_database import db
@ -176,8 +176,7 @@ class WorkflowService:
"""
# return default block config
default_block_configs = []
for node_class_mapping in NODE_TYPE_CLASSES_MAPPING.values():
node_class = node_class_mapping[LATEST_VERSION]
for node_type, node_class in node_type_classes_mapping.items():
default_config = node_class.get_default_config()
if default_config:
default_block_configs.append(default_config)
@ -191,13 +190,13 @@ class WorkflowService:
:param filters: filter by node config parameters.
:return:
"""
node_type_enum = NodeType(node_type)
node_type_enum: NodeType = NodeType(node_type)
# return default block config
if node_type_enum not in NODE_TYPE_CLASSES_MAPPING:
node_class = node_type_classes_mapping.get(node_type_enum)
if not node_class:
return None
node_class = NODE_TYPE_CLASSES_MAPPING[node_type_enum][LATEST_VERSION]
default_config = node_class.get_default_config(filters=filters)
if not default_config:
return None

View File

@ -1,4 +1,4 @@
from core.rag.datasource.vdb.analyticdb.analyticdb_vector import AnalyticdbVector
from core.rag.datasource.vdb.analyticdb.analyticdb_vector import AnalyticdbConfig, AnalyticdbVector
from core.rag.datasource.vdb.analyticdb.analyticdb_vector_openapi import AnalyticdbVectorOpenAPIConfig
from core.rag.datasource.vdb.analyticdb.analyticdb_vector_sql import AnalyticdbVectorBySqlConfig
from tests.integration_tests.vdb.test_vector_store import AbstractVectorTest, setup_mock_redis

View File

@ -19,36 +19,36 @@ from factories import variable_factory
def test_string_variable():
test_data = {"value_type": "string", "name": "test_text", "value": "Hello, World!"}
result = variable_factory.build_conversation_variable_from_mapping(test_data)
result = variable_factory.build_variable_from_mapping(test_data)
assert isinstance(result, StringVariable)
def test_integer_variable():
test_data = {"value_type": "number", "name": "test_int", "value": 42}
result = variable_factory.build_conversation_variable_from_mapping(test_data)
result = variable_factory.build_variable_from_mapping(test_data)
assert isinstance(result, IntegerVariable)
def test_float_variable():
test_data = {"value_type": "number", "name": "test_float", "value": 3.14}
result = variable_factory.build_conversation_variable_from_mapping(test_data)
result = variable_factory.build_variable_from_mapping(test_data)
assert isinstance(result, FloatVariable)
def test_secret_variable():
test_data = {"value_type": "secret", "name": "test_secret", "value": "secret_value"}
result = variable_factory.build_conversation_variable_from_mapping(test_data)
result = variable_factory.build_variable_from_mapping(test_data)
assert isinstance(result, SecretVariable)
def test_invalid_value_type():
test_data = {"value_type": "unknown", "name": "test_invalid", "value": "value"}
with pytest.raises(VariableError):
variable_factory.build_conversation_variable_from_mapping(test_data)
variable_factory.build_variable_from_mapping(test_data)
def test_build_a_blank_string():
result = variable_factory.build_conversation_variable_from_mapping(
result = variable_factory.build_variable_from_mapping(
{
"value_type": "string",
"name": "blank",
@ -80,7 +80,7 @@ def test_object_variable():
"key2": 2,
},
}
variable = variable_factory.build_conversation_variable_from_mapping(mapping)
variable = variable_factory.build_variable_from_mapping(mapping)
assert isinstance(variable, ObjectSegment)
assert isinstance(variable.value["key1"], str)
assert isinstance(variable.value["key2"], int)
@ -97,7 +97,7 @@ def test_array_string_variable():
"text",
],
}
variable = variable_factory.build_conversation_variable_from_mapping(mapping)
variable = variable_factory.build_variable_from_mapping(mapping)
assert isinstance(variable, ArrayStringVariable)
assert isinstance(variable.value[0], str)
assert isinstance(variable.value[1], str)
@ -114,7 +114,7 @@ def test_array_number_variable():
2.0,
],
}
variable = variable_factory.build_conversation_variable_from_mapping(mapping)
variable = variable_factory.build_variable_from_mapping(mapping)
assert isinstance(variable, ArrayNumberVariable)
assert isinstance(variable.value[0], int)
assert isinstance(variable.value[1], float)
@ -137,7 +137,7 @@ def test_array_object_variable():
},
],
}
variable = variable_factory.build_conversation_variable_from_mapping(mapping)
variable = variable_factory.build_variable_from_mapping(mapping)
assert isinstance(variable, ArrayObjectVariable)
assert isinstance(variable.value[0], dict)
assert isinstance(variable.value[1], dict)
@ -149,7 +149,7 @@ def test_array_object_variable():
def test_variable_cannot_large_than_200_kb():
with pytest.raises(VariableError):
variable_factory.build_conversation_variable_from_mapping(
variable_factory.build_variable_from_mapping(
{
"id": str(uuid4()),
"value_type": "string",

View File

@ -10,8 +10,7 @@ from core.workflow.enums import SystemVariableKey
from core.workflow.graph_engine.entities.graph import Graph
from core.workflow.graph_engine.entities.graph_init_params import GraphInitParams
from core.workflow.graph_engine.entities.graph_runtime_state import GraphRuntimeState
from core.workflow.nodes.variable_assigner.v1 import VariableAssignerNode
from core.workflow.nodes.variable_assigner.v1.node_data import WriteMode
from core.workflow.nodes.variable_assigner import VariableAssignerNode, WriteMode
from models.enums import UserFrom
from models.workflow import WorkflowType
@ -85,7 +84,6 @@ def test_overwrite_string_variable():
config={
"id": "node_id",
"data": {
"title": "test",
"assigned_variable_selector": ["conversation", conversation_variable.name],
"write_mode": WriteMode.OVER_WRITE.value,
"input_variable_selector": [DEFAULT_NODE_ID, input_variable.name],
@ -93,7 +91,7 @@ def test_overwrite_string_variable():
},
)
with mock.patch("core.workflow.nodes.variable_assigner.common.helpers.update_conversation_variable") as mock_run:
with mock.patch("core.workflow.nodes.variable_assigner.node.update_conversation_variable") as mock_run:
list(node.run())
mock_run.assert_called_once()
@ -168,7 +166,6 @@ def test_append_variable_to_array():
config={
"id": "node_id",
"data": {
"title": "test",
"assigned_variable_selector": ["conversation", conversation_variable.name],
"write_mode": WriteMode.APPEND.value,
"input_variable_selector": [DEFAULT_NODE_ID, input_variable.name],
@ -176,7 +173,7 @@ def test_append_variable_to_array():
},
)
with mock.patch("core.workflow.nodes.variable_assigner.common.helpers.update_conversation_variable") as mock_run:
with mock.patch("core.workflow.nodes.variable_assigner.node.update_conversation_variable") as mock_run:
list(node.run())
mock_run.assert_called_once()
@ -240,7 +237,6 @@ def test_clear_array():
config={
"id": "node_id",
"data": {
"title": "test",
"assigned_variable_selector": ["conversation", conversation_variable.name],
"write_mode": WriteMode.CLEAR.value,
"input_variable_selector": [],
@ -248,7 +244,7 @@ def test_clear_array():
},
)
with mock.patch("core.workflow.nodes.variable_assigner.common.helpers.update_conversation_variable") as mock_run:
with mock.patch("core.workflow.nodes.variable_assigner.node.update_conversation_variable") as mock_run:
list(node.run())
mock_run.assert_called_once()

View File

@ -1,24 +0,0 @@
import pytest
from core.variables import SegmentType
from core.workflow.nodes.variable_assigner.v2.enums import Operation
from core.workflow.nodes.variable_assigner.v2.helpers import is_input_value_valid
def test_is_input_value_valid_overwrite_array_string():
# Valid cases
assert is_input_value_valid(
variable_type=SegmentType.ARRAY_STRING, operation=Operation.OVER_WRITE, value=["hello", "world"]
)
assert is_input_value_valid(variable_type=SegmentType.ARRAY_STRING, operation=Operation.OVER_WRITE, value=[])
# Invalid cases
assert not is_input_value_valid(
variable_type=SegmentType.ARRAY_STRING, operation=Operation.OVER_WRITE, value="not an array"
)
assert not is_input_value_valid(
variable_type=SegmentType.ARRAY_STRING, operation=Operation.OVER_WRITE, value=[1, 2, 3]
)
assert not is_input_value_valid(
variable_type=SegmentType.ARRAY_STRING, operation=Operation.OVER_WRITE, value=["valid", 123, "invalid"]
)

View File

@ -6,7 +6,7 @@ from models import ConversationVariable
def test_from_variable_and_to_variable():
variable = variable_factory.build_conversation_variable_from_mapping(
variable = variable_factory.build_variable_from_mapping(
{
"id": str(uuid4()),
"name": "name",

Some files were not shown because too many files have changed in this diff.