Compare commits

...

157 Commits

Author SHA1 Message Date
2ab04bb933 fix Reranking mode is null 2024-08-06 19:03:32 +08:00
a3c2ab9a6e fix Reranking mode is null 2024-08-06 18:34:07 +08:00
c53875ce8c fix #6902 .docx handles images within tables and handles cross-column tables (#6951) 2024-08-06 17:14:24 +08:00
7f18c06b0a fix: code-block-missing-checks (#7002) 2024-08-06 16:11:14 +08:00
96dcf0fe8a fix: code tool fails when null property exists in object (#6988) 2024-08-06 16:11:00 +08:00
0c22e4e3d1 Feat/new confirm (#6984) 2024-08-06 14:31:13 +08:00
bd3ed89516 feat: add function calling for deepseek models (#6990) 2024-08-06 13:37:27 +08:00
1c043b8426 Chores: fix name typo (#6987) 2024-08-06 13:33:21 +08:00
23ed15d19f feat:nvidia add nemotron4-340b and microsoft/phi-3 (#6973) 2024-08-06 10:16:41 +08:00
312d905c9b chore: update duckduckgo tool (#6983) 2024-08-06 10:16:04 +08:00
cba9319cc7 fix doc (#6974) 2024-08-06 10:10:55 +08:00
d839f1ada7 version to 0.6.16 (#6972) 2024-08-05 23:33:37 +08:00
6da14c2d48 security: fix api image security issues (#6971) 2024-08-05 20:21:08 +08:00
a34285196b Revise the wrong pricing of certain LLM models. (#6967) 2024-08-05 18:41:44 +08:00
e4587b2151 chore: MAX_TREE_DEPTH spelling mistake (#6965) 2024-08-05 18:41:08 +08:00
ea30174057 chore: optimize streaming tts of xinference (#6966) 2024-08-05 18:23:23 +08:00
dd676866aa chore: exclude .txt extenstion in create_by_text API (#6956) 2024-08-05 15:52:07 +08:00
f0d10553b4 Fixed a bug where permission was clearly displaye… (#6934) 2024-08-05 13:19:01 +08:00
ef616c604a fix: The permissions issue of the editor role accessing some backend … (#6945)
Co-authored-by: liuzhenghua-jk <liuzhenghua-jk@360shuke.com>
2024-08-05 12:55:55 +08:00
2288efbf48 Fix: tag & settings modal in dataset card in Firefox (#6953) 2024-08-05 12:51:26 +08:00
f656e1bae2 fix: ensure db migration in docker entry script running with upgrade-db command for proper locking (#6946) 2024-08-05 10:55:26 +08:00
5a7fc8cd8c chore: fix markdown format and one typo (#6939) 2024-08-05 08:29:59 +08:00
141e4e0276 fix: restore xinference secret field (#6941)
Co-authored-by: liuzhenghua-jk <liuzhenghua-jk@360shuke.com>
2024-08-04 22:32:24 +08:00
20d3e1d297 Fix increase_usage of total_price in agent_runner (#6688) 2024-08-04 14:42:22 +08:00
79715345ef fix: import workflow errors (#6937) 2024-08-04 14:34:39 +08:00
dff3f41ef6 Workflow TTS playback node filtering issue. (#6877) 2024-08-04 14:28:56 +08:00
5e634a59a2 compatible xinference reranker server (#6927) 2024-08-04 13:49:38 +08:00
Joe 26e46d365c fix: workflow trace user_id error (#6932) 2024-08-04 03:28:50 +08:00
bcd7c8e921 fix: sending app trace data to other app trace provider (#6931) 2024-08-04 00:05:51 +08:00
70283f5b9f dep: support for Python 3.12 (#6771) 2024-08-02 21:14:36 +08:00
2e941bb91c add new provider Solar (#6884) 2024-08-02 20:48:09 +08:00
541bf1db5a feat: add the tool Serper for Google search. (#6786) (#6790) 2024-08-02 20:37:04 +08:00
048bc4c06e fix update dataset failed when embedding model is not exist (#6920) 2024-08-02 20:30:22 +08:00
4d0a6cc382 fix(nodes/knowledge-retrieval): workflow knowledge retrieval rerank model check (#6918) 2024-08-02 20:30:05 +08:00
6feea0d75b fix: default rerank model check (#6917) 2024-08-02 18:27:06 +08:00
Joe f97a51ce24 fix: reranking disable timer error (#6910) 2024-08-02 16:34:50 +08:00
df530b53e5 fix: system model setting missing space between buttons (#6912) 2024-08-02 16:26:16 +08:00
6aa02f8c63 dep: bump pgvecto-rs client from 0.1.x to 0.2.x (#6891) 2024-08-02 15:51:23 +08:00
7ab04e17e7 fix: return code in service api (#6911) 2024-08-02 15:48:58 +08:00
bf3f1027c8 fix: code execution node not display clear reasons when sandbox res error (#6830) 2024-08-02 15:36:44 +08:00
62cc4077bb Fix: webapp color theme (#6908) 2024-08-02 15:08:14 +08:00
e683461416 fix: knowledge save button visible (#6905) 2024-08-02 14:20:20 +08:00
33dab4fe54 fix: multiple retrieval default weighted score (#6897) 2024-08-02 14:05:27 +08:00
8166a8caf5 feat: update llama3.1 parameters for openrouter (#6901) 2024-08-02 13:13:34 +08:00
44801df8f8 fix score threshold limit be None (#6900) 2024-08-02 12:10:51 +08:00
56af1a0adf pref: change ollama embedded api request (#6876) 2024-08-02 12:04:47 +08:00
f8617db012 fix tongyi tool calls (#6896) 2024-08-02 10:03:43 +08:00
2ab9af3b38 delete weight_type in knowledge retrieval node (#6892) 2024-08-01 21:38:59 +08:00
24a89f7753 Modify/modify jp doc (#6889) 2024-08-01 20:33:35 +08:00
cc4785f094 fix: xinference reranker return_documents (#6888) 2024-08-01 19:57:53 +08:00
ian 093f902335 fix: Change API key authentication failure response code from 404 to 401 (#6885) 2024-08-01 17:41:35 +08:00
104c797dd0 feat: Add support for i18n Turkish language (tr-TR) (#6886)
Co-authored-by: hursit <hursit.topal@enuygun.com>
2024-08-01 17:30:35 +08:00
a9cd6df97e Remove tts (blocking call) (#6869) 2024-08-01 14:50:22 +08:00
f31142e758 Azure 4o mini options (#6873) 2024-08-01 14:04:18 +08:00
9ae88ede12 chore: n to 1 retrieval (#6839) 2024-08-01 13:45:18 +08:00
792f908afb Revert "feat:Azure gpt4o mini" (#6870) 2024-08-01 13:32:03 +08:00
29e3c3061c fix: remote image not display in answer node (#6867) 2024-08-01 13:21:49 +08:00
14367ddc09 feat:Azure gpt4o mini (#6866) 2024-08-01 13:03:08 +08:00
8157fccf6d delete weight_type (#6865) 2024-08-01 13:02:33 +08:00
cbf7f21ade Add azure gpt4omini (#6862)
Co-authored-by: luowei <glpat-EjySCyNjWiLqAED-YmwM>
Co-authored-by: crazywoola <427733928@qq.com>
Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
2024-08-01 12:57:52 +08:00
9c4f3be0f3 Fix keyboard shortcut conflict between workflow and browser (#6863) 2024-08-01 12:57:30 +08:00
f6e8e120a1 support xinference tts (#6746) 2024-08-01 11:59:15 +08:00
Joe 08f922d8c9 fix: anthropic max token NoneType error (#6858) 2024-08-01 11:30:00 +08:00
e9d6a43907 fix: model parameter selector (#6861) 2024-08-01 11:23:53 +08:00
feb4576ee7 chore: update SQLAlchemy configuration with custom naming convention (#6854) 2024-08-01 11:16:49 +08:00
56b43f62d1 feat: nvidia add llama3.1 model (#6844) 2024-07-31 21:24:02 +08:00
4b410494b3 Add model parameter enable_enhance for hunyuan llm model (#6847)
Co-authored-by: sun <sun@centen.cn>
2024-07-31 20:04:43 +08:00
13f5867a16 add unstructured profiles (#6846) 2024-07-31 19:39:38 +08:00
Joe df9bd36cab fix: claude-3-5-sonnet-20240620 max token error (#6843) 2024-07-31 18:34:44 +08:00
77c071e26f chore: upgrade slider ui (#6838) 2024-07-31 17:46:43 +08:00
af76381b98 fix notion internal setting (#6836) 2024-07-31 17:17:46 +08:00
35d0534eb9 chore: fix ssrf doc url (#6828) 2024-07-31 17:14:53 +08:00
4be12b29b9 fix: improved error handling for spider tool (#6835) 2024-07-31 17:11:52 +08:00
dd64e65ea0 fix: edit segment missing space between buttons (#6826)
Co-authored-by: xc Dou <xcdou@192.168.88.89>
2024-07-31 15:11:07 +08:00
c23aa50bea Add AWS builtin Tools (#6721)
Co-authored-by: Yuanbo Li <ybalbert@amazon.com>
Co-authored-by: crazywoola <427733928@qq.com>
2024-07-31 14:41:42 +08:00
8eb0d0fddd feat: support Celery auto-scale (#6249)
Co-authored-by: takatost <takatost@gmail.com>
2024-07-31 14:34:44 +08:00
8904745129 feat: tag filter adapte to scrolling (#6819) 2024-07-31 13:55:32 +08:00
936ac8826d Add docker-compose certbot configurations with backward compatibility (#6702)
Co-authored-by: Your Name <you@example.com>
2024-07-31 13:21:56 +08:00
545d3c5a93 chore: Add processId field for metrics of threads/db-pool-stat/health (#6797)
Co-authored-by: 老潮 <zhangyongsheng@3vjia.com>
Co-authored-by: takatost <takatost@users.noreply.github.com>
Co-authored-by: takatost <takatost@gmail.com>
2024-07-31 00:21:16 +08:00
3c371a6cb0 fix: workflow api (#6810) 2024-07-30 23:51:48 +08:00
9ce5cea911 feat: bedrock invoke enhancement (#6808) 2024-07-30 21:57:18 +08:00
98d9837fbc fix wrong charset when decoding Chinese content (#6774)
Co-authored-by: zhangwb <zhangwb@zts.com.cn>
2024-07-30 21:32:45 +08:00
53a89bbbc7 chore : option card (#6800) 2024-07-30 17:33:08 +08:00
0a744a73b3 fix: eco knowledge retrieval method (#6798) 2024-07-30 16:59:03 +08:00
0675c5f716 chore: add shortcut keys and hints for the shortcuts (#6779) 2024-07-30 16:18:58 +08:00
72963d1f13 fix: nonetype in webscraper validation (#6788) 2024-07-30 14:45:14 +08:00
028261f760 improve issue templates (#6785) 2024-07-30 14:17:45 +08:00
a98284b1ef refactor(api): Switch to dify_config (#6750)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-30 11:15:26 +08:00
daa31b2cb3 chore: remove redundant version pinning for indirect dependencies (#6772) 2024-07-30 08:45:57 +08:00
b414ea41d6 dep: initial support for Milvus 2.4.x (#6084) 2024-07-29 19:56:45 +08:00
Joe f78d0082ae feat: implement function dispatch table for trace processing (#6628) 2024-07-29 18:47:25 +08:00
3e18d32ce5 add deepseek-coder-v2 in siliconflow (#6149) 2024-07-29 18:45:19 +08:00
94d68b6a08 upgrade deepseek params (#6744) 2024-07-29 18:31:56 +08:00
c9ff0e3961 Add model hunyuan-embedding (#6657)
Co-authored-by: sun <sun@centen.cn>
2024-07-29 18:30:52 +08:00
8dd68e2034 fix(api/core/moderation/output_moderation.py): Fix config call. (#6769) 2024-07-29 18:30:29 +08:00
2cd662c43b chore: n to 1 retrieval legacy text (#6767) 2024-07-29 18:09:44 +08:00
4945184f8c fix: n to 1 retrieval legacy text (#6760) 2024-07-29 16:03:47 +08:00
cb01bf2986 chore: set logging level to debug when reading YAML files and falling back to default value in case of None (#6758) 2024-07-29 13:40:18 +08:00
f43e27814c Fix action button size (#6753) 2024-07-29 13:19:15 +08:00
20268708cc chore: improve position map conversion and tolerate empty position yaml file (#6541) 2024-07-29 10:32:11 +08:00
c8da4a1b7e Add jp translation for new features (#6749) 2024-07-29 08:58:48 +08:00
829472a1d7 switch to diffy_config with Pydantic in files, moderation and app (#6747)
Signed-off-by: -LAN- <laipz8200@outlook.com>
Co-authored-by: -LAN- <laipz8200@outlook.com>
2024-07-29 02:57:45 +08:00
e23461c837 Fix/6615 40 varchar limit on DatasetCollectionBinding and Embedding model name (#6723) 2024-07-28 09:42:58 +08:00
21f6caacd4 feat: enhance the firecrawl tool (#6705) 2024-07-27 15:00:06 +08:00
082c46a903 chore: migrate to poetry in devcontainer commands (#6724) 2024-07-27 14:49:34 +08:00
6a3bef8378 feat(api/core/app/segments): Update segment types and variables (#6734)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-27 14:43:51 +08:00
b6c3010f02 refactor(api/core/workflow/nodes/base_node.py): Update extract_variable_selector_to_variable_mapping method signature. (#6733)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-27 14:43:25 +08:00
90d2c01218 Feat/6725 can not get image url from cogview tool (#6728) 2024-07-27 00:07:31 +08:00
83af50368f fix(api/core/model_runtime/model_providers/azure_openai/llm/llm.py): Try to skip if delta.delta is None. (#6727)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-27 00:05:21 +08:00
cf258b7a67 add xlsx support hyperlink extract (#6722) 2024-07-26 19:26:52 +08:00
5d77dc4f58 feat(api/core/app/segments/parser.py): Remove blank segment in convert_template (#6709)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-26 18:19:33 +08:00
Joe e4542215cc fix: tongyi empty tool_calls is not supported in message (#6719) 2024-07-26 18:10:13 +08:00
3d3677e912 Feat/model provider novita (#6717)
Co-authored-by: takatost <takatost@gmail.com>
2024-07-26 17:37:21 +08:00
427f48be6b fix(answer/operation): feedback status in the logs (#6716) 2024-07-26 17:36:36 +08:00
c6996a48a4 refactor(api/core/app/segments): Support more kinds of Segments. (#6706)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-26 15:03:56 +08:00
6b50bb0fe6 issues #6655 Open ai tts issues (#6696) 2024-07-26 14:55:49 +08:00
80b3871c55 fix(log/list): Incorrect field 'app_id' causing annotations to fail t… (#6697) 2024-07-26 11:24:32 +08:00
4839523e53 Fix appId missing in annotations (#6699) 2024-07-26 11:21:51 +08:00
ecb9c311b5 chore: make prompt generator max tokens configurable (#6693) 2024-07-26 10:20:23 +08:00
bd97ce9489 fix: doc link in knowledge base (#6691) 2024-07-26 09:14:08 +08:00
79cb23e8ac security/SSRF vulns (#6682) 2024-07-25 20:50:26 +08:00
c5ac004f15 [seanguo] fix: unsupported filename in windows & add Mistral Large 2 (#6679) 2024-07-25 19:26:46 +08:00
5fbfa0f2c8 Update bug_report.yml (#6678) 2024-07-25 18:59:04 +08:00
78a339a794 modify llama3-1 yaml filename to support Windows pull operations (#6677) 2024-07-25 18:58:55 +08:00
f904df4b63 Add french and jp translation for new feature (#6675) 2024-07-25 18:55:16 +08:00
5e4ac11df3 fix: code block segmentation problem of markdown document (#6465) 2024-07-25 17:24:37 +08:00
16b4f560cd fix bugs(when using Oracle23ai as Vector DB) (#6658) 2024-07-25 17:07:14 +08:00
75e6576c67 refactor(api/core/app/segments): implement to_object in ObjectVariable and ArrayVariable. (#6671)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-25 17:06:38 +08:00
0b4c26578e Enhance database URI security and add URL encoding (#6668) 2024-07-25 16:48:00 +08:00
ebcc07e3e9 feat: support max_retries in jina requests (#6585) 2024-07-25 13:10:39 +08:00
55c2b61921 fix(api/fields/workflow_fields.py): Add check in environment variables (#6621) 2024-07-25 11:30:52 +08:00
ca696fe94c Add support of tool-call for model provider "hunyuan" (#6656)
Co-authored-by: sun <sun@centen.cn>
2024-07-25 11:27:58 +08:00
585444c50c chore: fix type annotations (#6600) 2024-07-25 11:21:51 +08:00
9815aab7a3 [seanguo] feat: add llama 3.1 support in bedrock (#6645) 2024-07-25 11:20:37 +08:00
349ec0db77 fix tencent_cos_storage image-preview error is not a byte (#6652) 2024-07-25 11:20:20 +08:00
a876baf0a9 Resolve variable type parameter error (#6646) 2024-07-25 11:15:54 +08:00
91fd8521c3 fix reranking model field error (#6654) 2024-07-25 10:07:55 +08:00
4ec9a87e46 fix(api/core/workflow/nodes/iteration/iteration_node.py): Extend output in iteration if output is a array. (#6647)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-25 00:32:39 +08:00
fb5e3662d5 Chores: add missing profile for middleware docker compose cmd and fix ssrf-proxy doc link (#6372)
Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
2024-07-24 19:36:06 +08:00
31efe10c75 refactor(api/core/workflow/workflow_engine_manager.py): Remove (#6630)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-24 19:35:40 +08:00
72bc9d5f2b feat(api/core/app/segments/variables.py): Support description in Variable. (#6636)
Signed-off-by: -LAN- <laipz8200@outlook.com>
2024-07-24 19:35:22 +08:00
600f13436d remove rerank model must be required when retrieval_model is multiple (#6640) 2024-07-24 19:34:41 +08:00
Joe b347a2f839 Feat/user session id search (#6638) 2024-07-24 19:34:23 +08:00
47b5bd7243 fix: value is not an array (#6632) 2024-07-24 19:14:04 +08:00
d4c55748f1 doc: fix about model features (#6619) 2024-07-24 19:12:10 +08:00
0625db0bf5 chore: optimize asynchronous workflow deletion performance of app related data (#6639) 2024-07-24 19:00:37 +08:00
05141ede16 chore: optimize asynchronous deletion performance of app related data (#6634) 2024-07-24 18:15:03 +08:00
c112188207 feat: added ActionButton component (#6631) 2024-07-24 18:09:44 +08:00
5af2df0cd5 fix: qwen fc error (#6620)
Co-authored-by: dufei <du_fei@venusgroup.com.cn>
2024-07-24 16:56:06 +08:00
f324374b95 Fix/6615 40 varchar limit on model name (#6623) 2024-07-24 16:23:16 +08:00
2aad128883 Fix: DSL backup (#6616) 2024-07-24 15:02:30 +08:00
3c78fdec1c Fix: reset button in embedded chatbot (#6611) 2024-07-24 14:46:52 +08:00
6fe9aa69cc feat: n to 1 retrieval legacy (#6554) 2024-07-24 12:50:48 +08:00
e4bb943fe5 Feat/delete single dataset retrival (#6570) 2024-07-24 12:50:11 +08:00
0fb741f269 fix: downgraded sentry-sdk to 1.44.1 due to claude LLM token returning 0 (#6597) 2024-07-24 04:49:03 +08:00
4c85393a1d feat: add GroqCloud llama3.1 series models support (#6596) 2024-07-24 00:41:58 +08:00
d5c2680fde feat: support llama3.1 series models for openrouter provider (#6595) 2024-07-24 00:37:48 +08:00
455 changed files with 13977 additions and 3191 deletions

View File

@@ -3,8 +3,8 @@
cd web && npm install
pipx install poetry
echo 'alias start-api="cd /workspaces/dify/api && flask run --host 0.0.0.0 --port=5001 --debug"' >> ~/.bashrc
echo 'alias start-worker="cd /workspaces/dify/api && celery -A app.celery worker -P gevent -c 1 --loglevel INFO -Q dataset,generation,mail,ops_trace,app_deletion"' >> ~/.bashrc
echo 'alias start-api="cd /workspaces/dify/api && poetry run python -m flask run --host 0.0.0.0 --port=5001 --debug"' >> ~/.bashrc
echo 'alias start-worker="cd /workspaces/dify/api && poetry run python -m celery -A app.celery worker -P gevent -c 1 --loglevel INFO -Q dataset,generation,mail,ops_trace,app_deletion"' >> ~/.bashrc
echo 'alias start-web="cd /workspaces/dify/web && npm run dev"' >> ~/.bashrc
echo 'alias start-containers="cd /workspaces/dify/docker && docker-compose -f docker-compose.middleware.yaml -p dify up -d"' >> ~/.bashrc

View File

@@ -9,7 +9,7 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true

View File

@@ -9,7 +9,7 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true

View File

@@ -9,7 +9,7 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true

View File

@@ -14,7 +14,7 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true
@@ -22,7 +22,6 @@ body:
- type: input
attributes:
label: Dify version
placeholder: 0.6.11
description: See about section in Dify console
validations:
required: true

View File

@@ -12,7 +12,7 @@ body:
required: true
- label: I confirm that I am using English to submit report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true

View File

@@ -12,7 +12,7 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true

View File

@@ -12,14 +12,13 @@ body:
required: true
- label: I confirm that I am using English to submit this report (我已阅读并同意 [Language Policy](https://github.com/langgenius/dify/issues/1542)).
required: true
- label: "请务必使用英文提交 Issue否则会被关闭。谢谢:"
- label: "[FOR CHINESE USERS] 请务必使用英文提交 Issue否则会被关闭。谢谢:"
required: true
- label: "Please do not modify this template :) and fill in all the required fields."
required: true
- type: input
attributes:
label: Dify version
placeholder: 0.3.21
description: Hover over system tray icon or look at Settings
validations:
required: true

View File

@@ -21,6 +21,7 @@ jobs:
python-version:
- "3.10"
- "3.11"
- "3.12"
steps:
- name: Checkout code
@@ -89,6 +90,5 @@ jobs:
pgvecto-rs
pgvector
chroma
myscale
- name: Test Vector Stores
run: poetry run -C api bash dev/pytest/pytest_vdb.sh

1 .gitignore vendored
View File

@@ -155,6 +155,7 @@ docker-legacy/volumes/milvus/*
docker-legacy/volumes/chroma/*
docker/volumes/app/storage/*
docker/volumes/certbot/*
docker/volumes/db/data/*
docker/volumes/redis/data/*
docker/volumes/weaviate/*

View File

@@ -1,7 +1,7 @@
Dify にコントリビュートしたいとお考えなのですね。それは素晴らしいことです。
私たちは、LLM アプリケーションの構築と管理のための最も直感的なワークフローを設計するという壮大な野望を持っています。人数も資金も限られている新興企業として、コミュニティからの支援は本当に重要です。
私たちは現状を鑑み、機敏かつ迅速に開発をする必要がありますが、同時にあなたのようなコントリビューターの方々に、可能な限りスムーズな貢献体験をしていただきたいと思っています。そのためにこのコントリビュートガイドを作成しました。
コードベースやコントリビュータの方々と私たちがどのように仕事をしているのかに慣れていただき、楽しいパートにすぐに飛び込めるようにすることが目的です。
このガイドは Dify そのものと同様に、継続的に改善されています。実際のプロジェクトに遅れをとることがあるかもしれませんが、ご理解のほどよろしくお願いいたします。
@@ -14,13 +14,13 @@ Dify にコントリビュートしたいとお考えなのですね。それは
### 機能リクエスト
* 新しい機能要望を出す場合は、提案する機能が何を実現するものなのかを説明し、可能な限り多くのコンテキストを含めてください。[@perzeusss](https://github.com/perzeuss)は、あなたの要望を書き出すのに役立つ [Feature Request Copilot](https://udify.app/chat/MK2kVSnw1gakVwMX) を作ってくれました。気軽に試してみてください。
* 既存の課題から 1 つ選びたい場合は、その下にコメントを書いてください。
関連する方向で作業しているチームメンバーが参加します。すべてが良好であれば、コーディングを開始する許可が与えられます。私たちが変更を提案した場合にあなたの作業が無駄になることがないよう、それまでこの機能の作業を控えていただくようお願いいたします。
提案された機能がどの分野に属するかによって、あなたは異なるチーム・メンバーと話をするかもしれません。以下は、各チームメンバーが現在取り組んでいる分野の概要です。
| Member | Scope |
| --------------------------------------------------------------------------------------- | ------------------------------------ |
@@ -153,7 +153,7 @@ Dify のバックエンドは[Flask](https://flask.palletsprojects.com/en/3.0.x/
いよいよ、私たちのリポジトリにプルリクエスト (PR) を提出する時が来ました。主要な機能については、まず `deploy/dev` ブランチにマージしてテストしてから `main` ブランチにマージします。
マージ競合などの問題が発生した場合、またはプル リクエストを開く方法がわからない場合は、[GitHub's pull request tutorial](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests) をチェックしてみてください。
これで完了です!あなたの PR がマージされると、[README](https://github.com/langgenius/dify/blob/main/README.md) にコントリビューターとして紹介されます。
## ヘルプを得る

View File

@@ -37,6 +37,7 @@
<a href="./README_KL.md"><img alt="README tlhIngan Hol" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="README in Korean" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_AR.md"><img alt="README بالعربية" src="https://img.shields.io/badge/العربية-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
@@ -64,7 +65,7 @@ Dify is an open-source LLM app development platform. Its intuitive interface com
Extensive RAG capabilities that cover everything from document ingestion to retrieval, with out-of-box support for text extraction from PDFs, PPTs, and other common document formats.
**5. Agent capabilities**:
You can define agents based on LLM Function Calling or ReAct, and add pre-built or custom tools for the agent. Dify provides 50+ built-in tools for AI agents, such as Google Search, DELL·E, Stable Diffusion and WolframAlpha.
You can define agents based on LLM Function Calling or ReAct, and add pre-built or custom tools for the agent. Dify provides 50+ built-in tools for AI agents, such as Google Search, DALL·E, Stable Diffusion and WolframAlpha.
**6. LLMOps**:
Monitor and analyze application logs and performance over time. You could continuously improve prompts, datasets, and models based on production data and annotations.

View File

@@ -37,6 +37,7 @@
<a href="./README_KL.md"><img alt="README tlhIngan Hol" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="README in Korean" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_AR.md"><img alt="README بالعربية" src="https://img.shields.io/badge/العربية-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
<div style="text-align: right;">
@@ -56,7 +57,7 @@
**4. خط أنابيب RAG**: قدرات RAG الواسعة التي تغطي كل شيء من استيعاب الوثائق إلى الاسترجاع، مع الدعم الفوري لاستخراج النص من ملفات PDF و PPT وتنسيقات الوثائق الشائعة الأخرى.
**5. قدرات الوكيل**: يمكنك تعريف الوكلاء بناءً على أمر وظيفة LLM أو ReAct، وإضافة أدوات مدمجة أو مخصصة للوكيل. توفر Dify أكثر من 50 أداة مدمجة لوكلاء الذكاء الاصطناعي، مثل البحث في Google و DELL·E وStable Diffusion و WolframAlpha.
**5. قدرات الوكيل**: يمكنك تعريف الوكلاء بناءً على أمر وظيفة LLM أو ReAct، وإضافة أدوات مدمجة أو مخصصة للوكيل. توفر Dify أكثر من 50 أداة مدمجة لوكلاء الذكاء الاصطناعي، مثل البحث في Google و DALL·E وStable Diffusion و WolframAlpha.
**6. الـ LLMOps**: راقب وتحلل سجلات التطبيق والأداء على مر الزمن. يمكنك تحسين الأوامر والبيانات والنماذج باستمرار استنادًا إلى البيانات الإنتاجية والتعليقات.

View File

@@ -36,6 +36,7 @@
<a href="./README_KL.md"><img alt="上个月的提交次数" src="https://img.shields.io/badge/法语-d9d9d9"></a>
<a href="./README_FR.md"><img alt="上个月的提交次数" src="https://img.shields.io/badge/克林贡语-d9d9d9"></a>
<a href="./README_KR.md"><img alt="上个月的提交次数" src="https://img.shields.io/badge/韓國語-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</div>
@@ -69,7 +70,7 @@ Dify 是一个开源的 LLM 应用开发平台。其直观的界面结合了 AI
广泛的 RAG 功能,涵盖从文档摄入到检索的所有内容,支持从 PDF、PPT 和其他常见文档格式中提取文本的开箱即用的支持。
**5. Agent 智能体**:
您可以基于 LLM 函数调用或 ReAct 定义 Agent并为 Agent 添加预构建或自定义工具。Dify 为 AI Agent 提供了50多种内置工具如谷歌搜索、DELL·E、Stable Diffusion 和 WolframAlpha 等。
您可以基于 LLM 函数调用或 ReAct 定义 Agent并为 Agent 添加预构建或自定义工具。Dify 为 AI Agent 提供了50多种内置工具如谷歌搜索、DALL·E、Stable Diffusion 和 WolframAlpha 等。
**6. LLMOps**:
随时间监视和分析应用程序日志和性能。您可以根据生产数据和标注持续改进提示、数据集和模型。

View File

@@ -36,6 +36,7 @@
<a href="./README_KL.md"><img alt="Actividad de Commits el último mes" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_FR.md"><img alt="Actividad de Commits el último mes" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="Actividad de Commits el último mes" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
#
@@ -69,7 +70,7 @@ Dify es una plataforma de desarrollo de aplicaciones de LLM de código abierto.
**5. Capacidades de agente**:
Puedes definir agentes basados en LLM Function Calling o ReAct, y agregar herramientas preconstruidas o personalizadas para el agente. Dify proporciona más de 50 herramientas integradas para agentes de IA, como Búsqueda de Google, DELL·E, Difusión Estable y WolframAlpha.
Puedes definir agentes basados en LLM Function Calling o ReAct, y agregar herramientas preconstruidas o personalizadas para el agente. Dify proporciona más de 50 herramientas integradas para agentes de IA, como Búsqueda de Google, DALL·E, Difusión Estable y WolframAlpha.
**6. LLMOps**:
Supervisa y analiza registros de aplicaciones y rendimiento a lo largo del tiempo. Podrías mejorar continuamente prompts, conjuntos de datos y modelos basados en datos de producción y anotaciones.
@@ -255,4 +256,4 @@ Para proteger tu privacidad, evita publicar problemas de seguridad en GitHub. En
## Licencia
Este repositorio está disponible bajo la [Licencia de Código Abierto de Dify](LICENSE), que es esencialmente Apache 2.0 con algunas restricciones adicionales.

View File

@@ -36,6 +36,7 @@
<a href="./README_KL.md"><img alt="Commits le mois dernier" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_FR.md"><img alt="Commits le mois dernier" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="Commits le mois dernier" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
#
@@ -69,7 +70,7 @@ Dify est une plateforme de développement d'applications LLM open source. Son in
**5. Capacités d'agent**:
Vous pouvez définir des agents basés sur l'appel de fonction LLM ou ReAct, et ajouter des outils pré-construits ou personnalisés pour l'agent. Dify fournit plus de 50 outils intégrés pour les agents d'IA, tels que la recherche Google, DELL·E, Stable Diffusion et WolframAlpha.
Vous pouvez définir des agents basés sur l'appel de fonction LLM ou ReAct, et ajouter des outils pré-construits ou personnalisés pour l'agent. Dify fournit plus de 50 outils intégrés pour les agents d'IA, tels que la recherche Google, DALL·E, Stable Diffusion et WolframAlpha.
**6. LLMOps**:
Surveillez et analysez les journaux d'application et les performances au fil du temps. Vous pouvez continuellement améliorer les prompts, les ensembles de données et les modèles en fonction des données de production et des annotations.

View File

@@ -36,6 +36,7 @@
<a href="./README_KL.md"><img alt="先月のコミット" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_FR.md"><img alt="先月のコミット" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="先月のコミット" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
#
@@ -68,7 +69,7 @@ DifyはオープンソースのLLMアプリケーション開発プラットフ
ドキュメントの取り込みから検索までをカバーする広範なRAG機能ができます。ほかにもPDF、PPT、その他の一般的なドキュメントフォーマットからのテキスト抽出のサーポイントも提供します。
**5. エージェント機能**:
LLM Function CallingやReActに基づくエージェントの定義が可能で、AIエージェント用のプリビルトまたはカスタムツールを追加できます。Difyには、Google検索、DELL·E、Stable Diffusion、WolframAlphaなどのAIエージェント用の50以上の組み込みツールが提供します。
LLM Function CallingやReActに基づくエージェントの定義が可能で、AIエージェント用のプリビルトまたはカスタムツールを追加できます。Difyには、Google検索、DALL·E、Stable Diffusion、WolframAlphaなどのAIエージェント用の50以上の組み込みツールが提供します。
**6. LLMOps**:
アプリケーションのログやパフォーマンスを監視と分析し、生産のデータと注釈に基づいて、プロンプト、データセット、モデルを継続的に改善できます。

View File

@@ -36,6 +36,7 @@
<a href="./README_KL.md"><img alt="Commits last month" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_FR.md"><img alt="Commits last month" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="Commits last month" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
#
@@ -67,7 +68,7 @@ Dify is an open-source LLM app development platform. Its intuitive interface com
Extensive RAG capabilities that cover everything from document ingestion to retrieval, with out-of-box support for text extraction from PDFs, PPTs, and other common document formats.
**5. Agent capabilities**:
You can define agents based on LLM Function Calling or ReAct, and add pre-built or custom tools for the agent. Dify provides 50+ built-in tools for AI agents, such as Google Search, DELL·E, Stable Diffusion and WolframAlpha.
You can define agents based on LLM Function Calling or ReAct, and add pre-built or custom tools for the agent. Dify provides 50+ built-in tools for AI agents, such as Google Search, DALL·E, Stable Diffusion and WolframAlpha.
**6. LLMOps**:
Monitor and analyze application logs and performance over time. You could continuously improve prompts, datasets, and models based on production data and annotations.
@@ -255,4 +256,4 @@ To protect your privacy, please avoid posting security issues on GitHub. Instead
## License
This repository is available under the [Dify Open Source License](LICENSE), which is essentially Apache 2.0 with a few additional restrictions.

View File

@@ -36,6 +36,7 @@
<a href="./README_FR.md"><img alt="README en Français" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_KL.md"><img alt="README tlhIngan Hol" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="한국어 README" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
@@ -63,7 +64,7 @@
문서 수집부터 검색까지 모든 것을 다루며, PDF, PPT 및 기타 일반적인 문서 형식에서 텍스트 추출을 위한 기본 지원이 포함되어 있는 광범위한 RAG 기능을 제공합니다.
**5. 에이전트 기능**:
LLM 함수 호출 또는 ReAct를 기반으로 에이전트를 정의하고 에이전트에 대해 사전 구축된 도구나 사용자 정의 도구를 추가할 수 있습니다. Dify는 Google Search, DELL·E, Stable Diffusion, WolframAlpha 등 AI 에이전트를 위한 50개 이상의 내장 도구를 제공합니다.
LLM 함수 호출 또는 ReAct를 기반으로 에이전트를 정의하고 에이전트에 대해 사전 구축된 도구나 사용자 정의 도구를 추가할 수 있습니다. Dify는 Google Search, DALL·E, Stable Diffusion, WolframAlpha 등 AI 에이전트를 위한 50개 이상의 내장 도구를 제공합니다.
**6. LLMOps**:
시간 경과에 따른 애플리케이션 로그와 성능을 모니터링하고 분석합니다. 생산 데이터와 주석을 기반으로 프롬프트, 데이터세트, 모델을 지속적으로 개선할 수 있습니다.

253 README_TR.md Normal file
View File

@@ -0,0 +1,253 @@
![cover-v5-optimized](https://github.com/langgenius/dify/assets/13230914/f9e19af5-61ba-4119-b926-d10c4c06ebab)
<p align="center">
<a href="https://cloud.dify.ai">Dify Bulut</a> ·
<a href="https://docs.dify.ai/getting-started/install-self-hosted">Kendi Sunucunuzda Barındırma</a> ·
<a href="https://docs.dify.ai">Dokümantasyon</a> ·
<a href="https://cal.com/guchenhe/60-min-meeting">Kurumsal Sorgu</a>
</p>
<p align="center">
<a href="https://dify.ai" target="_blank">
<img alt="Statik Rozet" src="https://img.shields.io/badge/Ürün-F04438"></a>
<a href="https://dify.ai/pricing" target="_blank">
<img alt="Statik Rozet" src="https://img.shields.io/badge/ücretsiz-fiyatlandırma?logo=free&color=%20%23155EEF&label=fiyatlandirma&labelColor=%20%23528bff"></a>
<a href="https://discord.gg/FngNHpbcY7" target="_blank">
<img src="https://img.shields.io/discord/1082486657678311454?logo=discord&labelColor=%20%235462eb&logoColor=%20%23f5f5f5&color=%20%235462eb"
alt="Discord'da sohbet et"></a>
<a href="https://twitter.com/intent/follow?screen_name=dify_ai" target="_blank">
<img src="https://img.shields.io/twitter/follow/dify_ai?logo=X&color=%20%23f5f5f5"
alt="Twitter'da takip et"></a>
<a href="https://hub.docker.com/u/langgenius" target="_blank">
<img alt="Docker Çekmeleri" src="https://img.shields.io/docker/pulls/langgenius/dify-web?labelColor=%20%23FDB062&color=%20%23f79009"></a>
<a href="https://github.com/langgenius/dify/graphs/commit-activity" target="_blank">
<img alt="Geçen ay yapılan commitler" src="https://img.shields.io/github/commit-activity/m/langgenius/dify?labelColor=%20%2332b583&color=%20%2312b76a"></a>
<a href="https://github.com/langgenius/dify/" target="_blank">
<img alt="Kapatılan sorunlar" src="https://img.shields.io/github/issues-search?query=repo%3Alanggenius%2Fdify%20is%3Aclosed&label=kapatilan%20sorunlar&labelColor=%20%237d89b0&color=%20%235d6b98"></a>
<a href="https://github.com/langgenius/dify/discussions/" target="_blank">
<img alt="Tartışma gönderileri" src="https://img.shields.io/github/discussions/langgenius/dify?labelColor=%20%239b8afb&color=%20%237a5af8"></a>
</p>
<p align="center">
<a href="./README.md"><img alt="README in English" src="https://img.shields.io/badge/English-d9d9d9"></a>
<a href="./README_CN.md"><img alt="简体中文版自述文件" src="https://img.shields.io/badge/简体中文-d9d9d9"></a>
<a href="./README_JA.md"><img alt="日本語のREADME" src="https://img.shields.io/badge/日本語-d9d9d9"></a>
<a href="./README_ES.md"><img alt="README en Español" src="https://img.shields.io/badge/Español-d9d9d9"></a>
<a href="./README_FR.md"><img alt="README en Français" src="https://img.shields.io/badge/Français-d9d9d9"></a>
<a href="./README_KL.md"><img alt="README tlhIngan Hol" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
<a href="./README_KR.md"><img alt="README in Korean" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
<a href="./README_AR.md"><img alt="README بالعربية" src="https://img.shields.io/badge/العربية-d9d9d9"></a>
<a href="./README_TR.md"><img alt="Türkçe README" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
</p>
Dify, açık kaynaklı bir LLM uygulama geliştirme platformudur. Sezgisel arayüzü, AI iş akışı, RAG pipeline'ı, ajan yetenekleri, model yönetimi, gözlemlenebilirlik özellikleri ve daha fazlasını birleştirerek, prototipten üretime hızlıca geçmenizi sağlar. İşte temel özelliklerin bir listesi:
</br> </br>
**1. Workflow**:
Görsel bir arayüz üzerinde güçlü AI iş akışları oluşturun ve test edin, aşağıdaki tüm özellikleri ve daha fazlasını kullanarak.
https://github.com/langgenius/dify/assets/13230914/356df23e-1604-483d-80a6-9517ece318aa
**2. Kapsamlı model desteği**:
Çok sayıda çıkarım sağlayıcısı ve kendi kendine barındırılan çözümlerden yüzlerce özel / açık kaynaklı LLM ile sorunsuz entegrasyon sağlar. GPT, Mistral, Llama3 ve OpenAI API uyumlu tüm modelleri kapsar. Desteklenen model sağlayıcılarının tam listesine [buradan](https://docs.dify.ai/getting-started/readme/model-providers) ulaşabilirsiniz.
![providers-v5](https://github.com/langgenius/dify/assets/13230914/5a17bdbe-097a-4100-8363-40255b70f6e3)
**3. Prompt IDE**:
Komut istemlerini oluşturmak, model performansını karşılaştırmak ve sohbet tabanlı uygulamalara metin-konuşma gibi ek özellikler eklemek için kullanıcı dostu bir arayüz.
**4. RAG Pipeline**:
Belge alımından bilgi çekmeye kadar geniş kapsamlı RAG yetenekleri. PDF'ler, PPT'ler ve diğer yaygın belge formatlarından metin çıkarma için hazır destek sunar.
**5. Ajan yetenekleri**:
LLM Fonksiyon Çağırma veya ReAct'a dayalı ajanlar tanımlayabilir ve bu ajanlara önceden hazırlanmış veya özel araçlar ekleyebilirsiniz. Dify, AI ajanları için Google Arama, DALL·E, Stable Diffusion ve WolframAlpha gibi 50'den fazla yerleşik araç sağlar.
**6. LLMOps**:
Uygulama loglarını ve performans metriklerini zaman içinde izleme ve analiz etme imkanı. Üretim ortamından elde edilen verilere ve kullanıcı geri bildirimlerine dayanarak, prompt'ları, veri setlerini ve modelleri sürekli olarak optimize edebilirsiniz. Bu sayede, AI uygulamanızın performansını ve doğruluğunu sürekli olarak artırabilirsiniz.
**7. Hizmet Olarak Backend**:
Dify'ın tüm özellikleri ilgili API'lerle birlikte gelir, böylece Dify'ı kendi iş mantığınıza kolayca entegre edebilirsiniz.
## Özellik karşılaştırması
<table style="width: 100%;">
<tr>
<th align="center">Özellik</th>
<th align="center">Dify.AI</th>
<th align="center">LangChain</th>
<th align="center">Flowise</th>
<th align="center">OpenAI Assistants API</th>
</tr>
<tr>
<td align="center">Programlama Yaklaşımı</td>
<td align="center">API + Uygulama odaklı</td>
<td align="center">Python Kodu</td>
<td align="center">Uygulama odaklı</td>
<td align="center">API odaklı</td>
</tr>
<tr>
<td align="center">Desteklenen LLM'ler</td>
<td align="center">Zengin Çeşitlilik</td>
<td align="center">Zengin Çeşitlilik</td>
<td align="center">Zengin Çeşitlilik</td>
<td align="center">Yalnızca OpenAI</td>
</tr>
<tr>
<td align="center">RAG Motoru</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
<tr>
<td align="center">Ajan</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
<tr>
<td align="center">İş Akışı</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
<tr>
<td align="center">Gözlemlenebilirlik</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
<tr>
<td align="center">Kurumsal Özellikler (SSO/Erişim kontrolü)</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
<tr>
<td align="center">Yerel Dağıtım</td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
<td align="center"></td>
</tr>
</table>
## Dify'ı Kullanma
- **Cloud </br>**
Herkesin sıfır kurulumla denemesi için bir [Dify Cloud](https://dify.ai) hizmeti sunuyoruz. Bu hizmet, kendi kendine dağıtılan versiyonun tüm yeteneklerini sağlar ve sandbox planında 200 ücretsiz GPT-4 çağrısı içerir.
- **Dify Topluluk Sürümünü Kendi Sunucunuzda Barındırma</br>**
Bu [başlangıç kılavuzu](#quick-start) ile Dify'ı kendi ortamınızda hızlıca çalıştırın.
Daha fazla referans ve detaylı talimatlar için [dokümantasyonumuzu](https://docs.dify.ai) kullanın.
- **Kurumlar / organizasyonlar için Dify</br>**
Ek kurumsal odaklı özellikler sunuyoruz. Kurumsal ihtiyaçları görüşmek için [bizimle bir toplantı planlayın](https://cal.com/guchenhe/30min) veya [bize bir e-posta gönderin](mailto:business@dify.ai?subject=[GitHub]Business%20License%20Inquiry). </br>
> AWS kullanan startuplar ve küçük işletmeler için, [AWS Marketplace'deki Dify Premium'a](https://aws.amazon.com/marketplace/pp/prodview-t22mebxzwjhu6) göz atın ve tek tıklamayla kendi AWS VPC'nize dağıtın. Bu, özel logo ve marka ile uygulamalar oluşturma seçeneğine sahip uygun fiyatlı bir AMI teklifdir.
## Güncel Kalma
GitHub'da Dify'a yıldız verin ve yeni sürümlerden anında haberdar olun.
![bizi-yıldızlayın](https://github.com/langgenius/dify/assets/13230914/b823edc1-6388-4e25-ad45-2f6b187adbb4)
## Hızlı başlangıç
> Dify'ı kurmadan önce, makinenizin aşağıdaki minimum sistem gereksinimlerini karşıladığından emin olun:
>
>- CPU >= 2 Çekirdek
>- RAM >= 4GB
</br>
Dify sunucusunu başlatmanın en kolay yolu, [docker-compose.yml](docker/docker-compose.yaml) dosyamızı çalıştırmaktır. Kurulum komutunu çalıştırmadan önce, makinenizde [Docker](https://docs.docker.com/get-docker/) ve [Docker Compose](https://docs.docker.com/compose/install/)'un kurulu olduğundan emin olun:
```bash
cd docker
cp .env.example .env
docker compose up -d
```
Çalıştırdıktan sonra, tarayıcınızda [http://localhost/install](http://localhost/install) adresinden Dify kontrol paneline erişebilir ve başlangıç ayarları sürecini başlatabilirsiniz.
> Eğer Dify'a katkıda bulunmak veya ek geliştirmeler yapmak isterseniz, [kaynak koddan dağıtım kılavuzumuza](https://docs.dify.ai/getting-started/install-self-hosted/local-source-code) başvurun.
## Sonraki adımlar
Yapılandırmayı özelleştirmeniz gerekiyorsa, lütfen [.env.example](docker/.env.example) dosyamızdaki yorumlara bakın ve `.env` dosyanızdaki ilgili değerleri güncelleyin. Ayrıca, spesifik dağıtım ortamınıza ve gereksinimlerinize bağlı olarak `docker-compose.yaml` dosyasının kendisinde de, imaj sürümlerini, port eşlemelerini veya hacim bağlantılarını değiştirmek gibi ayarlamalar yapmanız gerekebilir. Herhangi bir değişiklik yaptıktan sonra, lütfen `docker-compose up -d` komutunu tekrar çalıştırın. Kullanılabilir tüm ortam değişkenlerinin tam listesini [burada](https://docs.dify.ai/getting-started/install-self-hosted/environments) bulabilirsiniz.
Yüksek kullanılabilirliğe sahip bir kurulum yapılandırmak isterseniz, Dify'ın Kubernetes üzerine dağıtılmasına olanak tanıyan topluluk katkılı [Helm Charts](https://helm.sh/) ve YAML dosyaları mevcuttur.
- [@LeoQuote tarafından Helm Chart](https://github.com/douban/charts/tree/master/charts/dify)
- [@BorisPolonsky tarafından Helm Chart](https://github.com/BorisPolonsky/dify-helm)
- [@Winson-030 tarafından YAML dosyası](https://github.com/Winson-030/dify-kubernetes)
#### Dağıtım için Terraform Kullanımı
##### Azure Global
[Terraform](https://www.terraform.io/) kullanarak Dify'ı Azure'a tek tıklamayla dağıtın.
- [@nikawang tarafından Azure Terraform](https://github.com/nikawang/dify-azure-terraform)
## Katkıda Bulunma
Kod katkısında bulunmak isteyenler için [Katkı Kılavuzumuza](https://github.com/langgenius/dify/blob/main/CONTRIBUTING.md) bakabilirsiniz.
Aynı zamanda, lütfen Dify'ı sosyal medyada, etkinliklerde ve konferanslarda paylaşarak desteklemeyi düşünün.
> Dify'ı Mandarin veya İngilizce dışındaki dillere çevirmemize yardımcı olacak katkıda bulunanlara ihtiyacımız var. Yardımcı olmakla ilgileniyorsanız, lütfen daha fazla bilgi için [i18n README](https://github.com/langgenius/dify/blob/main/web/i18n/README.md) dosyasına bakın ve [Discord Topluluk Sunucumuzdaki](https://discord.gg/8Tpq4AcN9c) `global-users` kanalında bize bir yorum bırakın.
**Katkıda Bulunanlar**
<a href="https://github.com/langgenius/dify/graphs/contributors">
<img src="https://contrib.rocks/image?repo=langgenius/dify" />
</a>
## Topluluk & iletişim
* [Github Tartışmaları](https://github.com/langgenius/dify/discussions). En uygun: geri bildirim paylaşmak ve soru sormak için.
* [GitHub Sorunları](https://github.com/langgenius/dify/issues). En uygun: Dify.AI kullanırken karşılaştığınız hatalar ve özellik önerileri için. [Katkı Kılavuzumuza](https://github.com/langgenius/dify/blob/main/CONTRIBUTING.md) bakın.
* [Discord](https://discord.gg/FngNHpbcY7). En uygun: uygulamalarınızı paylaşmak ve toplulukla vakit geçirmek için.
* [Twitter](https://twitter.com/dify_ai). En uygun: uygulamalarınızı paylaşmak ve toplulukla vakit geçirmek için.
Veya doğrudan bir ekip üyesiyle toplantı planlayın:
<table>
<tr>
<th>İletişim Noktası</th>
<th>Amaç</th>
</tr>
<tr>
<td><a href='https://cal.com/guchenhe/15min' target='_blank'><img class="schedule-button" src='https://github.com/langgenius/dify/assets/13230914/9ebcd111-1205-4d71-83d5-948d70b809f5' alt='Git-Hub-README-Button-3x' style="width: 180px; height: auto; object-fit: contain;"/></a></td>
<td>İş sorgulamaları & ürün geri bildirimleri</td>
</tr>
<tr>
<td><a href='https://cal.com/pinkbanana' target='_blank'><img class="schedule-button" src='https://github.com/langgenius/dify/assets/13230914/d1edd00a-d7e4-4513-be6c-e57038e143fd' alt='Git-Hub-README-Button-2x' style="width: 180px; height: auto; object-fit: contain;"/></a></td>
<td>Katkılar, sorunlar & özellik istekleri</td>
</tr>
</table>
## Star history
[![Star History Chart](https://api.star-history.com/svg?repos=langgenius/dify&type=Date)](https://star-history.com/#langgenius/dify&Date)
## Güvenlik açıklaması
Gizliliğinizi korumak için, lütfen güvenlik sorunlarını GitHub'da paylaşmaktan kaçının. Bunun yerine, sorularınızı security@dify.ai adresine gönderin ve size daha detaylı bir cevap vereceğiz.
## Lisans
Bu depo, temel olarak Apache 2.0 lisansı ve birkaç ek kısıtlama içeren [Dify Açık Kaynak Lisansı](LICENSE) altında kullanıma sunulmuştur.

View File

@@ -183,6 +183,7 @@ UPLOAD_IMAGE_FILE_SIZE_LIMIT=10
# Model Configuration
MULTIMODAL_SEND_IMAGE_FORMAT=base64
PROMPT_GENERATION_MAX_TOKENS=512
# Mail configuration, support: resend, smtp
MAIL_TYPE=
@@ -216,6 +217,7 @@ UNSTRUCTURED_API_KEY=
SSRF_PROXY_HTTP_URL=
SSRF_PROXY_HTTPS_URL=
SSRF_DEFAULT_MAX_RETRIES=3
BATCH_UPLOAD_LIMIT=10
KEYWORD_DATA_SOURCE_TYPE=database
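These SSRF settings gate outbound requests made on behalf of user-supplied input (see the "security/SSRF vulns" commit above). A minimal sketch of how a proxy URL plus `SSRF_DEFAULT_MAX_RETRIES` might be consumed — the helper name `fetch_via_ssrf_proxy` and the use of `requests` here are illustrative assumptions, not Dify's actual `ssrf_proxy` module:

```python
# Hypothetical sketch: route user-supplied URLs through an egress proxy so
# they cannot reach internal hosts directly, retrying transient failures.
import os

import requests

SSRF_PROXY_HTTP_URL = os.getenv('SSRF_PROXY_HTTP_URL')
SSRF_PROXY_HTTPS_URL = os.getenv('SSRF_PROXY_HTTPS_URL')
SSRF_DEFAULT_MAX_RETRIES = int(os.getenv('SSRF_DEFAULT_MAX_RETRIES', '3'))

def fetch_via_ssrf_proxy(url: str) -> requests.Response:
    proxies = {'http': SSRF_PROXY_HTTP_URL, 'https': SSRF_PROXY_HTTPS_URL}
    last_exc = None
    for _ in range(SSRF_DEFAULT_MAX_RETRIES):
        try:
            # requests skips proxying when the proxy value is None
            return requests.get(url, proxies=proxies, timeout=10)
        except requests.RequestException as exc:
            last_exc = exc
    raise last_exc
```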

View File

@@ -41,8 +41,12 @@ ENV TZ=UTC
WORKDIR /app/api
RUN apt-get update \
&& apt-get install -y --no-install-recommends curl wget vim nodejs ffmpeg libgmp-dev libmpfr-dev libmpc-dev \
&& apt-get autoremove \
&& apt-get install -y --no-install-recommends curl nodejs libgmp-dev libmpfr-dev libmpc-dev \
&& echo "deb http://deb.debian.org/debian testing main" > /etc/apt/sources.list \
&& apt-get update \
# For Security
&& apt-get install -y --no-install-recommends zlib1g=1:1.3.dfsg+really1.3.1-1 expat=2.6.2-1 libldap-2.5-0=2.5.18+dfsg-2 perl=5.38.2-5 libsqlite3-0=3.46.0-1 \
&& apt-get autoremove -y \
&& rm -rf /var/lib/apt/lists/*
# Copy Python environment and packages

View File

@@ -12,7 +12,8 @@
```bash
cd ../docker
cp middleware.env.example middleware.env
docker compose -f docker-compose.middleware.yaml -p dify up -d
# change the profile to other vector database if you are not using weaviate
docker compose -f docker-compose.middleware.yaml --profile weaviate -p dify up -d
cd ../api
```

View File

@@ -261,6 +261,7 @@ def after_request(response):
@app.route('/health')
def health():
return Response(json.dumps({
'pid': os.getpid(),
'status': 'ok',
'version': app.config['CURRENT_VERSION']
}), status=200, content_type="application/json")
@@ -284,6 +285,7 @@ def threads():
})
return {
'pid': os.getpid(),
'thread_num': num_threads,
'threads': thread_list
}
@@ -293,6 +295,7 @@ def threads():
def pool_stat():
engine = db.engine
return {
'pid': os.getpid(),
'pool_size': engine.pool.size(),
'checked_in_connections': engine.pool.checkedin(),
'checked_out_connections': engine.pool.checkedout(),
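With `pid` added to the `/health`, `/threads`, and `/db-pool-stat` responses, each reply can be attributed to a specific worker process when several workers serve the same port. A minimal usage sketch — the base URL assumes a local API server on port 5001, as in the devcontainer aliases earlier in this diff:

```python
# Poll the health endpoint and note which worker process answered.
import requests

resp = requests.get('http://localhost:5001/health', timeout=5)
data = resp.json()
print(data['pid'], data['status'], data['version'])  # e.g. 1234 ok 0.6.16
```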

View File

@@ -249,8 +249,7 @@ def migrate_knowledge_vector_database():
create_count = 0
skipped_count = 0
total_count = 0
config = current_app.config
vector_type = config.get('VECTOR_STORE')
vector_type = dify_config.VECTOR_STORE
page = 1
while True:
try:
@@ -484,8 +483,7 @@ def convert_to_agent_apps():
@click.option('--field', default='metadata.doc_id', prompt=False, help='index field , default is metadata.doc_id.')
def add_qdrant_doc_id_index(field: str):
click.echo(click.style('Start add qdrant doc_id index.', fg='green'))
config = current_app.config
vector_type = config.get('VECTOR_STORE')
vector_type = dify_config.VECTOR_STORE
if vector_type != "qdrant":
click.echo(click.style('Sorry, only support qdrant vector store.', fg='red'))
return
@@ -502,13 +500,15 @@ add_qdrant_doc_id_index(field: str):
from core.rag.datasource.vdb.qdrant.qdrant_vector import QdrantConfig
for binding in bindings:
if dify_config.QDRANT_URL is None:
raise ValueError('Qdrant url is required.')
qdrant_config = QdrantConfig(
endpoint=config.get('QDRANT_URL'),
api_key=config.get('QDRANT_API_KEY'),
endpoint=dify_config.QDRANT_URL,
api_key=dify_config.QDRANT_API_KEY,
root_path=current_app.root_path,
timeout=config.get('QDRANT_CLIENT_TIMEOUT'),
grpc_port=config.get('QDRANT_GRPC_PORT'),
prefer_grpc=config.get('QDRANT_GRPC_ENABLED')
timeout=dify_config.QDRANT_CLIENT_TIMEOUT,
grpc_port=dify_config.QDRANT_GRPC_PORT,
prefer_grpc=dify_config.QDRANT_GRPC_ENABLED
)
try:
client = qdrant_client.QdrantClient(**qdrant_config.to_qdrant_params())
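This hunk is part of the broader `dify_config` migration (#6750): untyped `current_app.config.get(...)` lookups become attribute access on a Pydantic settings object, so a missing value surfaces as an explicit `None` check instead of propagating silently into `QdrantConfig`. A minimal sketch of the pattern, with hypothetical field names that only mirror `dify_config`'s style:

```python
# Illustrative only: not dify_config's real field set.
from pydantic import Field
from pydantic_settings import BaseSettings


class VectorStoreSettings(BaseSettings):
    VECTOR_STORE: str | None = None      # populated from env vars / .env
    QDRANT_URL: str | None = None
    QDRANT_API_KEY: str | None = None
    QDRANT_CLIENT_TIMEOUT: int = Field(default=20)


settings = VectorStoreSettings()
if settings.QDRANT_URL is None:          # typed access, explicit failure
    raise ValueError('Qdrant url is required.')
```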

View File

@@ -64,4 +64,6 @@ class DifyConfig(
return f'{self.HTTP_REQUEST_NODE_MAX_TEXT_SIZE / 1024 / 1024:.2f}MB'
SSRF_PROXY_HTTP_URL: str | None = None
SSRF_PROXY_HTTPS_URL: str | None = None
MODERATION_BUFFER_SIZE: int = Field(default=300, description='The buffer size for moderation.')

View File

@@ -1,4 +1,5 @@
from typing import Any, Optional
from urllib.parse import quote_plus
from pydantic import Field, NonNegativeInt, PositiveInt, computed_field
from pydantic_settings import BaseSettings
@@ -104,7 +105,7 @@ class DatabaseConfig:
).strip("&")
db_extras = f"?{db_extras}" if db_extras else ""
return (f"{self.SQLALCHEMY_DATABASE_URI_SCHEME}://"
f"{self.DB_USERNAME}:{self.DB_PASSWORD}@{self.DB_HOST}:{self.DB_PORT}/{self.DB_DATABASE}"
f"{quote_plus(self.DB_USERNAME)}:{quote_plus(self.DB_PASSWORD)}@{self.DB_HOST}:{self.DB_PORT}/{self.DB_DATABASE}"
f"{db_extras}")
SQLALCHEMY_POOL_SIZE: NonNegativeInt = Field(
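Worth spelling out why `quote_plus` matters here (commit "Enhance database URI security and add URL encoding", #6668): a password containing `@`, `/`, or `:` would otherwise be parsed as part of the URI structure. A quick sketch:

```python
# Credentials with reserved characters must be percent-encoded in the URI.
from urllib.parse import quote_plus

user, password = 'dify', 'p@ss/word:1'
uri = f"postgresql://{quote_plus(user)}:{quote_plus(password)}@localhost:5432/dify"
print(uri)  # postgresql://dify:p%40ss%2Fword%3A1@localhost:5432/dify
```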

View File

@@ -9,7 +9,7 @@ class PackagingInfo(BaseSettings):
CURRENT_VERSION: str = Field(
description='Dify version',
default='0.6.15',
default='0.6.16',
)
COMMIT_SHA: str = Field(

View File

@@ -15,6 +15,7 @@ language_timezone_mapping = {
'ro-RO': 'Europe/Bucharest',
'pl-PL': 'Europe/Warsaw',
'hi-IN': 'Asia/Kolkata',
'tr-TR': 'Europe/Istanbul',
}
languages = list(language_timezone_mapping.keys())

View File

@@ -23,8 +23,7 @@ class AnnotationReplyActionApi(Resource):
@account_initialization_required
@cloud_edition_billing_resource_check('annotation')
def post(self, app_id, action):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -47,8 +46,7 @@ class AppAnnotationSettingDetailApi(Resource):
@login_required
@account_initialization_required
def get(self, app_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -61,8 +59,7 @@ class AppAnnotationSettingUpdateApi(Resource):
@login_required
@account_initialization_required
def post(self, app_id, annotation_setting_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -82,8 +79,7 @@ class AnnotationReplyActionStatusApi(Resource):
@account_initialization_required
@cloud_edition_billing_resource_check('annotation')
def get(self, app_id, job_id, action):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
job_id = str(job_id)
@@ -110,8 +106,7 @@ class AnnotationListApi(Resource):
@login_required
@account_initialization_required
def get(self, app_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
page = request.args.get('page', default=1, type=int)
@@ -135,8 +130,7 @@ class AnnotationExportApi(Resource):
@login_required
@account_initialization_required
def get(self, app_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -154,8 +148,7 @@ class AnnotationCreateApi(Resource):
@cloud_edition_billing_resource_check('annotation')
@marshal_with(annotation_fields)
def post(self, app_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -174,8 +167,7 @@ class AnnotationUpdateDeleteApi(Resource):
@cloud_edition_billing_resource_check('annotation')
@marshal_with(annotation_fields)
def post(self, app_id, annotation_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -191,8 +183,7 @@ class AnnotationUpdateDeleteApi(Resource):
@login_required
@account_initialization_required
def delete(self, app_id, annotation_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -207,8 +198,7 @@ class AnnotationBatchImportApi(Resource):
@account_initialization_required
@cloud_edition_billing_resource_check('annotation')
def post(self, app_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
app_id = str(app_id)
@@ -232,8 +222,7 @@ class AnnotationBatchImportStatusApi(Resource):
@account_initialization_required
@cloud_edition_billing_resource_check('annotation')
def get(self, app_id, job_id):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
job_id = str(job_id)
@@ -259,8 +248,7 @@ class AnnotationHitHistoryListApi(Resource):
@login_required
@account_initialization_required
def get(self, app_id, annotation_id):
# The role of the current user in the table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
page = request.args.get('page', default=1, type=int)
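Every handler in this file swaps `is_admin_or_owner` for `is_editor`, which resolves #6945: editors could reach these annotation screens but the backend rejected them. A sketch of the role helpers these checks assume — the role values are an assumption based on common Dify workspace roles, not copied from the model:

```python
# Hypothetical reconstruction of the Account role properties used above.
class Account:
    def __init__(self, role: str):
        self.role = role  # e.g. 'owner', 'admin', 'editor', 'normal'

    @property
    def is_admin_or_owner(self) -> bool:
        return self.role in ('admin', 'owner')

    @property
    def is_editor(self) -> bool:
        # Editors, admins, and owners all pass, so the new check widens
        # access from admins/owners to editors as well.
        return self.role in ('admin', 'owner', 'editor')


assert Account('editor').is_editor and not Account('editor').is_admin_or_owner
```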

View File

@@ -22,7 +22,7 @@ from fields.conversation_fields import (
)
from libs.helper import datetime_string
from libs.login import login_required
from models.model import AppMode, Conversation, Message, MessageAnnotation
from models.model import AppMode, Conversation, EndUser, Message, MessageAnnotation
class CompletionConversationApi(Resource):
@@ -143,7 +143,7 @@ class ChatConversationApi(Resource):
@get_app_model(mode=[AppMode.CHAT, AppMode.AGENT_CHAT, AppMode.ADVANCED_CHAT])
@marshal_with(conversation_with_summary_pagination_fields)
def get(self, app_model):
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
parser = reqparse.RequestParser()
parser.add_argument('keyword', type=str, location='args')
@@ -156,19 +156,31 @@
parser.add_argument('limit', type=int_range(1, 100), required=False, default=20, location='args')
args = parser.parse_args()
subquery = (
db.session.query(
Conversation.id.label('conversation_id'),
EndUser.session_id.label('from_end_user_session_id')
)
.outerjoin(EndUser, Conversation.from_end_user_id == EndUser.id)
.subquery()
)
query = db.select(Conversation).where(Conversation.app_id == app_model.id)
if args['keyword']:
keyword_filter = '%{}%'.format(args['keyword'])
query = query.join(
Message, Message.conversation_id == Conversation.id
Message, Message.conversation_id == Conversation.id,
).join(
subquery, subquery.c.conversation_id == Conversation.id
).filter(
or_(
Message.query.ilike('%{}%'.format(args['keyword'])),
Message.answer.ilike('%{}%'.format(args['keyword'])),
Conversation.name.ilike('%{}%'.format(args['keyword'])),
Conversation.introduction.ilike('%{}%'.format(args['keyword'])),
Message.query.ilike(keyword_filter),
Message.answer.ilike(keyword_filter),
Conversation.name.ilike(keyword_filter),
Conversation.introduction.ilike(keyword_filter),
subquery.c.from_end_user_session_id.ilike(keyword_filter)
),
)
account = current_user
@ -233,7 +245,7 @@ class ChatConversationDetailApi(Resource):
@get_app_model(mode=[AppMode.CHAT, AppMode.AGENT_CHAT, AppMode.ADVANCED_CHAT])
@marshal_with(conversation_detail_fields)
def get(self, app_model, conversation_id):
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
conversation_id = str(conversation_id)
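The new keyword filter joins a subquery so that a hit on the end user's session_id also matches. A self-contained sketch of the same outer-join-plus-subquery pattern; the table definitions here are simplified stand-ins, not Dify's schema:

from sqlalchemy import Column, ForeignKey, String, create_engine, or_, select
from sqlalchemy.orm import Session, declarative_base

Base = declarative_base()

class EndUser(Base):
    __tablename__ = 'end_users'
    id = Column(String, primary_key=True)
    session_id = Column(String)

class Conversation(Base):
    __tablename__ = 'conversations'
    id = Column(String, primary_key=True)
    name = Column(String)
    from_end_user_id = Column(String, ForeignKey('end_users.id'))

engine = create_engine('sqlite://')
Base.metadata.create_all(engine)

with Session(engine) as session:
    session.add_all([EndUser(id='u1', session_id='web-abc'),
                     Conversation(id='c1', name='hello', from_end_user_id='u1')])
    session.commit()

    # Attach each conversation's end-user session id via an outer join,
    # so one keyword can match either the conversation or its session id.
    subquery = (
        select(Conversation.id.label('conversation_id'),
               EndUser.session_id.label('from_end_user_session_id'))
        .outerjoin(EndUser, Conversation.from_end_user_id == EndUser.id)
        .subquery()
    )
    keyword_filter = '%abc%'
    query = (
        select(Conversation)
        .join(subquery, subquery.c.conversation_id == Conversation.id)
        .where(or_(Conversation.name.ilike(keyword_filter),
                   subquery.c.from_end_user_session_id.ilike(keyword_filter)))
    )
    print([c.name for c in session.scalars(query)])  # ['hello'] via the session-id hit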

View File

@ -1,3 +1,5 @@
import os
from flask_login import current_user
from flask_restful import Resource, reqparse
@ -28,13 +30,15 @@ class RuleGenerateApi(Resource):
args = parser.parse_args()
account = current_user
PROMPT_GENERATION_MAX_TOKENS = int(os.getenv('PROMPT_GENERATION_MAX_TOKENS', '512'))
try:
rules = LLMGenerator.generate_rule_config(
tenant_id=account.current_tenant_id,
instruction=args['instruction'],
model_config=args['model_config'],
no_variable=args['no_variable']
no_variable=args['no_variable'],
rule_config_max_tokens=PROMPT_GENERATION_MAX_TOKENS
)
except ProviderTokenNotInitError as ex:
raise ProviderNotInitializeError(ex.description)

View File

@ -149,8 +149,7 @@ class MessageAnnotationApi(Resource):
@get_app_model
@marshal_with(annotation_fields)
def post(self, app_model):
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
parser = reqparse.RequestParser()

View File

@ -17,8 +17,6 @@ from ..wraps import account_initialization_required
def get_oauth_providers():
with current_app.app_context():
if not dify_config.NOTION_CLIENT_ID or not dify_config.NOTION_CLIENT_SECRET:
return {}
notion_oauth = NotionOAuth(client_id=dify_config.NOTION_CLIENT_ID,
client_secret=dify_config.NOTION_CLIENT_SECRET,
redirect_uri=dify_config.CONSOLE_API_URL + '/console/api/oauth/data-source/callback/notion')

View File

@ -71,7 +71,7 @@ class ResetPasswordApi(Resource):
# AccountService.update_password(account, new_password)
# todo: Send email
# MAILCHIMP_API_KEY = current_app.config['MAILCHIMP_TRANSACTIONAL_API_KEY']
# MAILCHIMP_API_KEY = dify_config.MAILCHIMP_TRANSACTIONAL_API_KEY
# mailchimp = MailchimpTransactional(MAILCHIMP_API_KEY)
# message = {
@ -92,7 +92,7 @@ class ResetPasswordApi(Resource):
# 'message': message,
# # required for transactional email
# ' settings': {
# 'sandbox_mode': current_app.config['MAILCHIMP_SANDBOX_MODE'],
# 'sandbox_mode': dify_config.MAILCHIMP_SANDBOX_MODE,
# },
# })

View File

@ -189,8 +189,6 @@ class DatasetApi(Resource):
dataset = DatasetService.get_dataset(dataset_id_str)
if dataset is None:
raise NotFound("Dataset not found.")
# check user's model setting
DatasetService.check_dataset_model_setting(dataset)
parser = reqparse.RequestParser()
parser.add_argument('name', nullable=False,
@ -215,6 +213,13 @@ class DatasetApi(Resource):
args = parser.parse_args()
data = request.get_json()
# check embedding model setting
if data.get('indexing_technique') == 'high_quality':
DatasetService.check_embedding_model_setting(dataset.tenant_id,
data.get('embedding_model_provider'),
data.get('embedding_model')
)
# The role of the current user in the ta table must be admin, owner, editor, or dataset_operator
DatasetPermissionService.check_permission(
current_user, dataset, data.get('permission'), data.get('partial_member_list')
@ -233,7 +238,8 @@ class DatasetApi(Resource):
DatasetPermissionService.update_partial_member_list(
tenant_id, dataset_id_str, data.get('partial_member_list')
)
else:
# clear partial member list when permission is only_me or all_team_members
elif data.get('permission') == 'only_me' or data.get('permission') == 'all_team_members':
DatasetPermissionService.clear_partial_member_list(dataset_id_str)
partial_member_list = DatasetPermissionService.get_dataset_partial_member_list(dataset_id_str)

View File

@ -223,8 +223,7 @@ class DatasetDocumentSegmentAddApi(Resource):
document = DocumentService.get_document(dataset_id, document_id)
if not document:
raise NotFound('Document not found.')
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
# check embedding model setting
if dataset.indexing_technique == 'high_quality':
@ -347,7 +346,7 @@ class DatasetDocumentSegmentUpdateApi(Resource):
if not segment:
raise NotFound('Segment not found.')
# The role of the current user in the ta table must be admin or owner
if not current_user.is_admin_or_owner:
if not current_user.is_editor:
raise Forbidden()
try:
DatasetService.check_dataset_permission(dataset, current_user)

View File

@ -19,7 +19,7 @@ def inner_api_only(view):
# get header 'X-Inner-Api-Key'
inner_api_key = request.headers.get('X-Inner-Api-Key')
if not inner_api_key or inner_api_key != dify_config.INNER_API_KEY:
abort(404)
abort(401)
return view(*args, **kwargs)

View File

@ -53,7 +53,7 @@ class ConversationDetailApi(Resource):
ConversationService.delete(app_model, conversation_id, end_user)
except services.errors.conversation.ConversationNotExistsError:
raise NotFound("Conversation Not Exists.")
return {"result": "success"}, 204
return {'result': 'success'}, 200
class ConversationRenameApi(Resource):

View File

@ -29,22 +29,21 @@ from services.app_generate_service import AppGenerateService
logger = logging.getLogger(__name__)
workflow_run_fields = {
'id': fields.String,
'workflow_id': fields.String,
'status': fields.String,
'inputs': fields.Raw,
'outputs': fields.Raw,
'error': fields.String,
'total_steps': fields.Integer,
'total_tokens': fields.Integer,
'created_at': fields.DateTime,
'finished_at': fields.DateTime,
'elapsed_time': fields.Float,
}
class WorkflowRunApi(Resource):
workflow_run_fields = {
'id': fields.String,
'workflow_id': fields.String,
'status': fields.String,
'inputs': fields.Raw,
'outputs': fields.Raw,
'error': fields.String,
'total_steps': fields.Integer,
'total_tokens': fields.Integer,
'created_at': fields.DateTime,
'finished_at': fields.DateTime,
'elapsed_time': fields.Float,
}
class WorkflowRunDetailApi(Resource):
@validate_app_token
@marshal_with(workflow_run_fields)
def get(self, app_model: App, workflow_id: str):
@ -57,7 +56,7 @@ class WorkflowRunApi(Resource):
workflow_run = db.session.query(WorkflowRun).filter(WorkflowRun.id == workflow_id).first()
return workflow_run
class WorkflowRunApi(Resource):
@validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.JSON, required=True))
def post(self, app_model: App, end_user: EndUser):
"""
@ -117,5 +116,6 @@ class WorkflowTaskStopApi(Resource):
}
api.add_resource(WorkflowRunApi, '/workflows/run/<string:workflow_id>', '/workflows/run')
api.add_resource(WorkflowRunApi, '/workflows/run')
api.add_resource(WorkflowRunDetailApi, '/workflows/run/<string:workflow_id>')
api.add_resource(WorkflowTaskStopApi, '/workflows/tasks/<string:task_id>/stop')
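After this split, POST /workflows/run starts a run and GET /workflows/run/<workflow_run_id> fetches one through the new WorkflowRunDetailApi. A hedged client sketch against the service API — the base URL and token are placeholders, and the body and response field names are assumptions, not confirmed by this diff:

import httpx

BASE = 'https://api.dify.example/v1'            # placeholder service-API base URL
HEADERS = {'Authorization': 'Bearer app-xxxx'}  # app token checked by @validate_app_token

# POST /workflows/run starts a run; the body shape here is illustrative.
run = httpx.post(f'{BASE}/workflows/run', headers=HEADERS,
                 json={'inputs': {}, 'response_mode': 'blocking', 'user': 'end-user-1'}).json()

# GET /workflows/run/<id> now maps to WorkflowRunDetailApi.
run_id = run.get('workflow_run_id')             # field name assumed from the WorkflowRun model
detail = httpx.get(f'{BASE}/workflows/run/{run_id}', headers=HEADERS).json()
print(detail.get('status'))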

View File

@ -79,6 +79,7 @@ class CotAgentRunner(BaseAgentRunner, ABC):
llm_usage.completion_tokens += usage.completion_tokens
llm_usage.prompt_price += usage.prompt_price
llm_usage.completion_price += usage.completion_price
llm_usage.total_price += usage.total_price
model_instance = self.model_instance

View File

@ -62,6 +62,7 @@ class FunctionCallAgentRunner(BaseAgentRunner):
llm_usage.completion_tokens += usage.completion_tokens
llm_usage.prompt_price += usage.prompt_price
llm_usage.completion_price += usage.completion_price
llm_usage.total_price += usage.total_price
model_instance = self.model_instance

View File

@ -62,7 +62,12 @@ class DatasetConfigManager:
return None
# dataset configs
dataset_configs = config.get('dataset_configs', {'retrieval_model': 'single'})
if 'dataset_configs' in config and config.get('dataset_configs'):
dataset_configs = config.get('dataset_configs')
else:
dataset_configs = {
'retrieval_model': 'multiple'
}
query_variable = config.get('dataset_query_variable')
if dataset_configs['retrieval_model'] == 'single':
@ -83,9 +88,11 @@ class DatasetConfigManager:
retrieve_strategy=DatasetRetrieveConfigEntity.RetrieveStrategy.value_of(
dataset_configs['retrieval_model']
),
top_k=dataset_configs.get('top_k'),
top_k=dataset_configs.get('top_k', 4),
score_threshold=dataset_configs.get('score_threshold'),
reranking_model=dataset_configs.get('reranking_model')
reranking_model=dataset_configs.get('reranking_model'),
weights=dataset_configs.get('weights'),
reranking_enabled=dataset_configs.get('reranking_enabled', True),
)
)
@ -114,12 +121,6 @@ class DatasetConfigManager:
if not isinstance(config["dataset_configs"], dict):
raise ValueError("dataset_configs must be of object type")
if config["dataset_configs"]['retrieval_model'] == 'multiple':
if not config["dataset_configs"]['reranking_model']:
raise ValueError("reranking_model has not been set")
if not isinstance(config["dataset_configs"]['reranking_model'], dict):
raise ValueError("reranking_model must be of object type")
if not isinstance(config["dataset_configs"], dict):
raise ValueError("dataset_configs must be of object type")

View File

@ -158,8 +158,13 @@ class DatasetRetrieveConfigEntity(BaseModel):
retrieve_strategy: RetrieveStrategy
top_k: Optional[int] = None
score_threshold: Optional[float] = None
score_threshold: Optional[float] = 0.0
rerank_mode: Optional[str] = 'reranking_model'
reranking_model: Optional[dict] = None
weights: Optional[dict] = None
reranking_enabled: Optional[bool] = True
class DatasetEntity(BaseModel):

View File

@ -5,7 +5,12 @@ import queue
import re
import threading
from core.app.entities.queue_entities import QueueAgentMessageEvent, QueueLLMChunkEvent, QueueTextChunkEvent
from core.app.entities.queue_entities import (
QueueAgentMessageEvent,
QueueLLMChunkEvent,
QueueNodeSucceededEvent,
QueueTextChunkEvent,
)
from core.model_manager import ModelManager
from core.model_runtime.entities.model_entities import ModelType
@ -88,6 +93,8 @@ class AppGeneratorTTSPublisher:
self.msg_text += message.event.chunk.delta.message.content
elif isinstance(message.event, QueueTextChunkEvent):
self.msg_text += message.event.text
elif isinstance(message.event, QueueNodeSucceededEvent):
self.msg_text += message.event.outputs.get('output', '')
self.last_message = message
sentence_arr, text_tmp = self._extract_sentence(self.msg_text)
if len(sentence_arr) >= min(self.MAX_SENTENCE, 7):

View File

@ -244,7 +244,12 @@ class AdvancedChatAppGenerateTaskPipeline(BasedGenerateTaskPipeline, WorkflowCyc
:return:
"""
for message in self._queue_manager.listen():
if publisher:
if hasattr(message.event, 'metadata') and message.event.metadata.get('is_answer_previous_node', False) and publisher:
publisher.publish(message=message)
elif (hasattr(message.event, 'execution_metadata')
and message.event.execution_metadata
and message.event.execution_metadata.get('is_answer_previous_node', False)
and publisher):
publisher.publish(message=message)
event = message.event

View File

@ -110,7 +110,8 @@ class AgentChatAppGenerator(MessageBasedAppGenerator):
)
# get tracing instance
trace_manager = TraceQueueManager(app_model.id)
user_id = user.id if isinstance(user, Account) else user.session_id
trace_manager = TraceQueueManager(app_model.id, user_id)
# init application generate entity
application_generate_entity = AgentChatAppGenerateEntity(

View File

@ -5,9 +5,9 @@ from collections.abc import Generator
from enum import Enum
from typing import Any
from flask import current_app
from sqlalchemy.orm import DeclarativeMeta
from configs import dify_config
from core.app.entities.app_invoke_entities import InvokeFrom
from core.app.entities.queue_entities import (
AppQueueEvent,
@ -48,7 +48,7 @@ class AppQueueManager:
:return:
"""
# wait for APP_MAX_EXECUTION_TIME seconds to stop listen
listen_timeout = current_app.config.get("APP_MAX_EXECUTION_TIME")
listen_timeout = dify_config.APP_MAX_EXECUTION_TIME
start_time = time.time()
last_ping_time = 0
while True:

View File

@ -74,7 +74,8 @@ class WorkflowAppGenerator(BaseAppGenerator):
)
# get tracing instance
trace_manager = TraceQueueManager(app_model.id)
user_id = user.id if isinstance(user, Account) else user.session_id
trace_manager = TraceQueueManager(app_model.id, user_id)
# init application generate entity
application_generate_entity = WorkflowAppGenerateEntity(

View File

@ -1,8 +1,21 @@
from .segment_group import SegmentGroup
from .segments import NoneSegment, Segment
from .segments import (
ArrayAnySegment,
FileSegment,
FloatSegment,
IntegerSegment,
NoneSegment,
ObjectSegment,
Segment,
StringSegment,
)
from .types import SegmentType
from .variables import (
ArrayVariable,
ArrayAnyVariable,
ArrayFileVariable,
ArrayNumberVariable,
ArrayObjectVariable,
ArrayStringVariable,
FileVariable,
FloatVariable,
IntegerVariable,
@ -20,11 +33,21 @@ __all__ = [
'SecretVariable',
'FileVariable',
'StringVariable',
'ArrayVariable',
'ArrayAnyVariable',
'Variable',
'SegmentType',
'SegmentGroup',
'Segment',
'NoneSegment',
'NoneVariable',
'IntegerSegment',
'FloatSegment',
'ObjectSegment',
'ArrayAnySegment',
'FileSegment',
'StringSegment',
'ArrayStringVariable',
'ArrayNumberVariable',
'ArrayObjectVariable',
'ArrayFileVariable',
]

View File

@ -3,14 +3,25 @@ from typing import Any
from core.file.file_obj import FileVar
from .segments import Segment, StringSegment
from .segments import (
ArrayAnySegment,
FileSegment,
FloatSegment,
IntegerSegment,
NoneSegment,
ObjectSegment,
Segment,
StringSegment,
)
from .types import SegmentType
from .variables import (
ArrayVariable,
ArrayFileVariable,
ArrayNumberVariable,
ArrayObjectVariable,
ArrayStringVariable,
FileVariable,
FloatVariable,
IntegerVariable,
NoneVariable,
ObjectVariable,
SecretVariable,
StringVariable,
@ -28,40 +39,48 @@ def build_variable_from_mapping(m: Mapping[str, Any], /) -> Variable:
match value_type:
case SegmentType.STRING:
return StringVariable.model_validate(m)
case SegmentType.SECRET:
return SecretVariable.model_validate(m)
case SegmentType.NUMBER if isinstance(value, int):
return IntegerVariable.model_validate(m)
case SegmentType.NUMBER if isinstance(value, float):
return FloatVariable.model_validate(m)
case SegmentType.SECRET:
return SecretVariable.model_validate(m)
case SegmentType.NUMBER if not isinstance(value, float | int):
raise ValueError(f'invalid number value {value}')
case SegmentType.FILE:
return FileVariable.model_validate(m)
case SegmentType.OBJECT if isinstance(value, dict):
return ObjectVariable.model_validate(
{**m, 'value': {k: build_variable_from_mapping(v) for k, v in value.items()}}
)
case SegmentType.ARRAY_STRING if isinstance(value, list):
return ArrayStringVariable.model_validate({**m, 'value': [build_variable_from_mapping(v) for v in value]})
case SegmentType.ARRAY_NUMBER if isinstance(value, list):
return ArrayNumberVariable.model_validate({**m, 'value': [build_variable_from_mapping(v) for v in value]})
case SegmentType.ARRAY_OBJECT if isinstance(value, list):
return ArrayObjectVariable.model_validate({**m, 'value': [build_variable_from_mapping(v) for v in value]})
case SegmentType.ARRAY_FILE if isinstance(value, list):
return ArrayFileVariable.model_validate({**m, 'value': [build_variable_from_mapping(v) for v in value]})
raise ValueError(f'not supported value type {value_type}')
def build_anonymous_variable(value: Any, /) -> Variable:
if value is None:
return NoneVariable(name='anonymous')
if isinstance(value, str):
return StringVariable(name='anonymous', value=value)
if isinstance(value, int):
return IntegerVariable(name='anonymous', value=value)
if isinstance(value, float):
return FloatVariable(name='anonymous', value=value)
if isinstance(value, dict):
# TODO: Limit the depth of the object
obj = {k: build_anonymous_variable(v) for k, v in value.items()}
return ObjectVariable(name='anonymous', value=obj)
if isinstance(value, list):
# TODO: Limit the depth of the array
elements = [build_anonymous_variable(v) for v in value]
return ArrayVariable(name='anonymous', value=elements)
if isinstance(value, FileVar):
return FileVariable(name='anonymous', value=value)
raise ValueError(f'not supported value {value}')
def build_segment(value: Any, /) -> Segment:
if value is None:
return NoneSegment()
if isinstance(value, str):
return StringSegment(value=value)
if isinstance(value, int):
return IntegerSegment(value=value)
if isinstance(value, float):
return FloatSegment(value=value)
if isinstance(value, dict):
# TODO: Limit the depth of the object
obj = {k: build_segment(v) for k, v in value.items()}
return ObjectSegment(value=obj)
if isinstance(value, list):
# TODO: Limit the depth of the array
elements = [build_segment(v) for v in value]
return ArrayAnySegment(value=elements)
if isinstance(value, FileVar):
return FileSegment(value=value)
raise ValueError(f'not supported value {value}')
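A standalone mini-version of the dispatch in build_segment above, showing how plain Python values map onto typed segments with dicts and lists handled recursively; this is illustrative only, using a stand-in Seg class instead of the real Segment hierarchy:

from dataclasses import dataclass
from typing import Any

@dataclass
class Seg:
    type: str
    value: Any

def build_segment_demo(value: Any) -> Seg:
    if value is None:
        return Seg('none', None)
    if isinstance(value, str):
        return Seg('string', value)
    if isinstance(value, int):   # note: bools also pass this check, as in the original
        return Seg('number', value)
    if isinstance(value, float):
        return Seg('number', value)
    if isinstance(value, dict):
        return Seg('object', {k: build_segment_demo(v) for k, v in value.items()})
    if isinstance(value, list):
        return Seg('array[any]', [build_segment_demo(v) for v in value])
    raise ValueError(f'not supported value {value}')

print(build_segment_demo({'name': 'dify', 'tags': ['a', 1]}))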

View File

@ -1,17 +1,18 @@
import re
from core.app.segments import SegmentGroup, factory
from core.workflow.entities.variable_pool import VariablePool
from . import SegmentGroup, factory
VARIABLE_PATTERN = re.compile(r'\{\{#([a-zA-Z0-9_]{1,50}(?:\.[a-zA-Z_][a-zA-Z0-9_]{0,29}){1,10})#\}\}')
def convert_template(*, template: str, variable_pool: VariablePool):
parts = re.split(VARIABLE_PATTERN, template)
segments = []
for part in parts:
for part in filter(lambda x: x, parts):
if '.' in part and (value := variable_pool.get(part.split('.'))):
segments.append(value)
else:
segments.append(factory.build_segment(part))
return SegmentGroup(segments=segments)
return SegmentGroup(value=segments)
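The new filter(lambda x: x, parts) matters because re.split with a capturing pattern keeps empty strings at the boundaries. A runnable illustration with the same pattern:

import re

VARIABLE_PATTERN = re.compile(r'\{\{#([a-zA-Z0-9_]{1,50}(?:\.[a-zA-Z_][a-zA-Z0-9_]{0,29}){1,10})#\}\}')

template = '{{#node1.output#}} world'
parts = re.split(VARIABLE_PATTERN, template)
print(parts)                    # ['', 'node1.output', ' world'] -- leading empty string
print([p for p in parts if p])  # ['node1.output', ' world'] -- what the loop now iterates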

View File

@ -1,19 +1,22 @@
from pydantic import BaseModel
from .segments import Segment
from .types import SegmentType
class SegmentGroup(BaseModel):
segments: list[Segment]
class SegmentGroup(Segment):
value_type: SegmentType = SegmentType.GROUP
value: list[Segment]
@property
def text(self):
return ''.join([segment.text for segment in self.segments])
return ''.join([segment.text for segment in self.value])
@property
def log(self):
return ''.join([segment.log for segment in self.segments])
return ''.join([segment.log for segment in self.value])
@property
def markdown(self):
return ''.join([segment.markdown for segment in self.segments])
return ''.join([segment.markdown for segment in self.value])
def to_object(self):
return [segment.to_object() for segment in self.value]

View File

@ -1,7 +1,11 @@
import json
from collections.abc import Mapping, Sequence
from typing import Any
from pydantic import BaseModel, ConfigDict, field_validator
from core.file.file_obj import FileVar
from .types import SegmentType
@ -34,12 +38,6 @@ class Segment(BaseModel):
return str(self.value)
def to_object(self) -> Any:
if isinstance(self.value, Segment):
return self.value.to_object()
if isinstance(self.value, list):
return [v.to_object() for v in self.value]
if isinstance(self.value, dict):
return {k: v.to_object() for k, v in self.value.items()}
return self.value
@ -63,3 +61,80 @@ class NoneSegment(Segment):
class StringSegment(Segment):
value_type: SegmentType = SegmentType.STRING
value: str
class FloatSegment(Segment):
value_type: SegmentType = SegmentType.NUMBER
value: float
class IntegerSegment(Segment):
value_type: SegmentType = SegmentType.NUMBER
value: int
class FileSegment(Segment):
value_type: SegmentType = SegmentType.FILE
# TODO: embed FileVar in this model.
value: FileVar
@property
def markdown(self) -> str:
return self.value.to_markdown()
class ObjectSegment(Segment):
value_type: SegmentType = SegmentType.OBJECT
value: Mapping[str, Segment]
@property
def text(self) -> str:
# TODO: Process variables.
return json.dumps(self.model_dump()['value'], ensure_ascii=False)
@property
def log(self) -> str:
# TODO: Process variables.
return json.dumps(self.model_dump()['value'], ensure_ascii=False, indent=2)
@property
def markdown(self) -> str:
# TODO: Use markdown code block
return json.dumps(self.model_dump()['value'], ensure_ascii=False, indent=2)
def to_object(self):
return {k: v.to_object() for k, v in self.value.items()}
class ArraySegment(Segment):
@property
def markdown(self) -> str:
return '\n'.join(['- ' + item.markdown for item in self.value])
def to_object(self):
return [v.to_object() for v in self.value]
class ArrayAnySegment(ArraySegment):
value_type: SegmentType = SegmentType.ARRAY_ANY
value: Sequence[Segment]
class ArrayStringSegment(ArraySegment):
value_type: SegmentType = SegmentType.ARRAY_STRING
value: Sequence[StringSegment]
class ArrayNumberSegment(ArraySegment):
value_type: SegmentType = SegmentType.ARRAY_NUMBER
value: Sequence[FloatSegment | IntegerSegment]
class ArrayObjectSegment(ArraySegment):
value_type: SegmentType = SegmentType.ARRAY_OBJECT
value: Sequence[ObjectSegment]
class ArrayFileSegment(ArraySegment):
value_type: SegmentType = SegmentType.ARRAY_FILE
value: Sequence[FileSegment]

View File

@ -6,6 +6,12 @@ class SegmentType(str, Enum):
NUMBER = 'number'
STRING = 'string'
SECRET = 'secret'
ARRAY = 'array'
ARRAY_ANY = 'array[any]'
ARRAY_STRING = 'array[string]'
ARRAY_NUMBER = 'array[number]'
ARRAY_OBJECT = 'array[object]'
ARRAY_FILE = 'array[file]'
OBJECT = 'object'
FILE = 'file'
GROUP = 'group'

View File

@ -1,12 +1,21 @@
import json
from collections.abc import Mapping, Sequence
from pydantic import Field
from core.file.file_obj import FileVar
from core.helper import encrypter
from .segments import NoneSegment, Segment, StringSegment
from .segments import (
ArrayAnySegment,
ArrayFileSegment,
ArrayNumberSegment,
ArrayObjectSegment,
ArrayStringSegment,
FileSegment,
FloatSegment,
IntegerSegment,
NoneSegment,
ObjectSegment,
Segment,
StringSegment,
)
from .types import SegmentType
@ -20,59 +29,47 @@ class Variable(Segment):
description="Unique identity for variable. It's only used by environment variables now.",
)
name: str
description: str = Field(default='', description='Description of the variable.')
class StringVariable(StringSegment, Variable):
pass
class FloatVariable(Variable):
value_type: SegmentType = SegmentType.NUMBER
value: float
class FloatVariable(FloatSegment, Variable):
pass
class IntegerVariable(Variable):
value_type: SegmentType = SegmentType.NUMBER
value: int
class IntegerVariable(IntegerSegment, Variable):
pass
class ObjectVariable(Variable):
value_type: SegmentType = SegmentType.OBJECT
value: Mapping[str, Variable]
@property
def text(self) -> str:
# TODO: Process variables.
return json.dumps(self.model_dump()['value'], ensure_ascii=False)
@property
def log(self) -> str:
# TODO: Process variables.
return json.dumps(self.model_dump()['value'], ensure_ascii=False, indent=2)
@property
def markdown(self) -> str:
# TODO: Use markdown code block
return json.dumps(self.model_dump()['value'], ensure_ascii=False, indent=2)
class FileVariable(FileSegment, Variable):
pass
class ArrayVariable(Variable):
value_type: SegmentType = SegmentType.ARRAY
value: Sequence[Variable]
@property
def markdown(self) -> str:
return '\n'.join(['- ' + item.markdown for item in self.value])
class ObjectVariable(ObjectSegment, Variable):
pass
class FileVariable(Variable):
value_type: SegmentType = SegmentType.FILE
# TODO: embed FileVar in this model.
value: FileVar
class ArrayAnyVariable(ArrayAnySegment, Variable):
pass
@property
def markdown(self) -> str:
return self.value.to_markdown()
class ArrayStringVariable(ArrayStringSegment, Variable):
pass
class ArrayNumberVariable(ArrayNumberSegment, Variable):
pass
class ArrayObjectVariable(ArrayObjectSegment, Variable):
pass
class ArrayFileVariable(ArrayFileSegment, Variable):
pass
class SecretVariable(StringVariable):

View File

@ -131,6 +131,7 @@ class WorkflowCycleManage(WorkflowIterationCycleManage):
TraceTaskName.WORKFLOW_TRACE,
workflow_run=workflow_run,
conversation_id=conversation_id,
user_id=trace_manager.user_id,
)
)
@ -173,6 +174,7 @@ class WorkflowCycleManage(WorkflowIterationCycleManage):
TraceTaskName.WORKFLOW_TRACE,
workflow_run=workflow_run,
conversation_id=conversation_id,
user_id=trace_manager.user_id,
)
)

View File

@ -6,8 +6,7 @@ import os
import time
from typing import Optional
from flask import current_app
from configs import dify_config
from extensions.ext_storage import storage
IMAGE_EXTENSIONS = ['jpg', 'jpeg', 'png', 'webp', 'gif', 'svg']
@ -23,7 +22,7 @@ class UploadFileParser:
if upload_file.extension not in IMAGE_EXTENSIONS:
return None
if current_app.config['MULTIMODAL_SEND_IMAGE_FORMAT'] == 'url' or force_url:
if dify_config.MULTIMODAL_SEND_IMAGE_FORMAT == 'url' or force_url:
return cls.get_signed_temp_image_url(upload_file.id)
else:
# get image file base64
@ -44,13 +43,13 @@ class UploadFileParser:
:param upload_file: UploadFile object
:return:
"""
base_url = current_app.config.get('FILES_URL')
base_url = dify_config.FILES_URL
image_preview_url = f'{base_url}/files/{upload_file_id}/image-preview'
timestamp = str(int(time.time()))
nonce = os.urandom(16).hex()
data_to_sign = f"image-preview|{upload_file_id}|{timestamp}|{nonce}"
secret_key = current_app.config['SECRET_KEY'].encode()
secret_key = dify_config.SECRET_KEY.encode()
sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
encoded_sign = base64.urlsafe_b64encode(sign).decode()
@ -68,7 +67,7 @@ class UploadFileParser:
:return:
"""
data_to_sign = f"image-preview|{upload_file_id}|{timestamp}|{nonce}"
secret_key = current_app.config['SECRET_KEY'].encode()
secret_key = dify_config.SECRET_KEY.encode()
recalculated_sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
recalculated_encoded_sign = base64.urlsafe_b64encode(recalculated_sign).decode()
@ -77,4 +76,4 @@ class UploadFileParser:
return False
current_time = int(time.time())
return current_time - int(timestamp) <= current_app.config.get('FILES_ACCESS_TIMEOUT')
return current_time - int(timestamp) <= dify_config.FILES_ACCESS_TIMEOUT
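Both the signer and the verifier above derive the same HMAC over "image-preview|id|timestamp|nonce". A self-contained reproduction of the signature math; the secret key and file id here are placeholders:

import base64
import hashlib
import hmac
import os
import time

secret_key = b'placeholder-secret'  # stands in for dify_config.SECRET_KEY
upload_file_id = 'example-file-id'  # illustrative id
timestamp = str(int(time.time()))
nonce = os.urandom(16).hex()

data_to_sign = f'image-preview|{upload_file_id}|{timestamp}|{nonce}'
sign = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
encoded_sign = base64.urlsafe_b64encode(sign).decode()

# Verification recomputes the digest over the same fields and compares.
recalculated = hmac.new(secret_key, data_to_sign.encode(), hashlib.sha256).digest()
assert base64.urlsafe_b64encode(recalculated).decode() == encoded_sign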

View File

@ -107,11 +107,11 @@ class CodeExecutor:
response = response.json()
except:
raise CodeExecutionException('Failed to parse response')
if (code := response.get('code')) != 0:
raise CodeExecutionException(f"Got error code: {code}. Got error msg: {response.get('message')}")
response = CodeExecutionResponse(**response)
if response.code != 0:
raise CodeExecutionException(response.message)
if response.data.error:
raise CodeExecutionException(response.data.error)
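The parsing change validates the whole payload into a CodeExecutionResponse before checking fields, instead of poking at the raw dict. A standalone sketch of that pattern — the model shape is inferred from the hunk, so treat it as an approximation:

from typing import Optional

from pydantic import BaseModel

class Data(BaseModel):
    stdout: Optional[str] = None
    error: Optional[str] = None

class CodeExecutionResponse(BaseModel):
    code: int
    message: Optional[str] = None
    data: Data

payload = {'code': 0, 'message': '', 'data': {'stdout': 'ok', 'error': None}}
response = CodeExecutionResponse(**payload)
if response.code != 0:
    raise RuntimeError(response.message)
if response.data.error:
    raise RuntimeError(response.data.error)
print(response.data.stdout)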

View File

@ -13,18 +13,10 @@ def get_position_map(folder_path: str, *, file_name: str = "_position.yaml") ->
:param file_name: the YAML file name, default to '_position.yaml'
:return: a dict with name as key and index as value
"""
position_file_name = os.path.join(folder_path, file_name)
if not position_file_name or not os.path.exists(position_file_name):
return {}
positions = load_yaml_file(position_file_name, ignore_error=True)
position_map = {}
index = 0
for _, name in enumerate(positions):
if name and isinstance(name, str):
position_map[name.strip()] = index
index += 1
return position_map
position_file_path = os.path.join(folder_path, file_name)
yaml_content = load_yaml_file(file_path=position_file_path, default_value=[])
positions = [item.strip() for item in yaml_content if item and isinstance(item, str) and item.strip()]
return {name: index for index, name in enumerate(positions)}
def sort_by_position_map(
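The rewritten get_position_map above collapses the manual loop into a filter plus enumerate. The same behavior, runnable standalone with an in-memory list standing in for the parsed _position.yaml:

yaml_content = ['  openai ', 'anthropic', None, 42, '', 'cohere']  # as if loaded from _position.yaml

positions = [item.strip() for item in yaml_content
             if item and isinstance(item, str) and item.strip()]
position_map = {name: index for index, name in enumerate(positions)}
print(position_map)  # {'openai': 0, 'anthropic': 1, 'cohere': 2}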

View File

@ -1,48 +1,75 @@
"""
Proxy requests to avoid SSRF
"""
import logging
import os
import time
import httpx
SSRF_PROXY_ALL_URL = os.getenv('SSRF_PROXY_ALL_URL', '')
SSRF_PROXY_HTTP_URL = os.getenv('SSRF_PROXY_HTTP_URL', '')
SSRF_PROXY_HTTPS_URL = os.getenv('SSRF_PROXY_HTTPS_URL', '')
SSRF_DEFAULT_MAX_RETRIES = int(os.getenv('SSRF_DEFAULT_MAX_RETRIES', '3'))
proxies = {
'http://': SSRF_PROXY_HTTP_URL,
'https://': SSRF_PROXY_HTTPS_URL
} if SSRF_PROXY_HTTP_URL and SSRF_PROXY_HTTPS_URL else None
BACKOFF_FACTOR = 0.5
STATUS_FORCELIST = [429, 500, 502, 503, 504]
def make_request(method, url, **kwargs):
if SSRF_PROXY_ALL_URL:
return httpx.request(method=method, url=url, proxy=SSRF_PROXY_ALL_URL, **kwargs)
elif proxies:
return httpx.request(method=method, url=url, proxies=proxies, **kwargs)
else:
return httpx.request(method=method, url=url, **kwargs)
def make_request(method, url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
if "allow_redirects" in kwargs:
allow_redirects = kwargs.pop("allow_redirects")
if "follow_redirects" not in kwargs:
kwargs["follow_redirects"] = allow_redirects
retries = 0
while retries <= max_retries:
try:
if SSRF_PROXY_ALL_URL:
response = httpx.request(method=method, url=url, proxy=SSRF_PROXY_ALL_URL, **kwargs)
elif proxies:
response = httpx.request(method=method, url=url, proxies=proxies, **kwargs)
else:
response = httpx.request(method=method, url=url, **kwargs)
if response.status_code not in STATUS_FORCELIST:
return response
else:
logging.warning(f"Received status code {response.status_code} for URL {url} which is in the force list")
except httpx.RequestError as e:
logging.warning(f"Request to URL {url} failed on attempt {retries + 1}: {e}")
retries += 1
if retries <= max_retries:
time.sleep(BACKOFF_FACTOR * (2 ** (retries - 1)))
raise Exception(f"Reached maximum retries ({max_retries}) for URL {url}")
def get(url, **kwargs):
return make_request('GET', url, **kwargs)
def get(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('GET', url, max_retries=max_retries, **kwargs)
def post(url, **kwargs):
return make_request('POST', url, **kwargs)
def post(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('POST', url, max_retries=max_retries, **kwargs)
def put(url, **kwargs):
return make_request('PUT', url, **kwargs)
def put(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('PUT', url, max_retries=max_retries, **kwargs)
def patch(url, **kwargs):
return make_request('PATCH', url, **kwargs)
def patch(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('PATCH', url, max_retries=max_retries, **kwargs)
def delete(url, **kwargs):
return make_request('DELETE', url, **kwargs)
def delete(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('DELETE', url, max_retries=max_retries, **kwargs)
def head(url, **kwargs):
return make_request('HEAD', url, **kwargs)
def head(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
return make_request('HEAD', url, max_retries=max_retries, **kwargs)
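With BACKOFF_FACTOR = 0.5, the sleep between attempts doubles each retry. A quick check of the schedule, plus hedged usage of the new keyword (the import path is an assumption about where this module lives):

BACKOFF_FACTOR = 0.5
print([BACKOFF_FACTOR * (2 ** (retries - 1)) for retries in (1, 2, 3)])  # [0.5, 1.0, 2.0]

# Usage sketch -- assumes this module is importable as core.helper.ssrf_proxy:
# from core.helper import ssrf_proxy
# response = ssrf_proxy.get('https://example.com/feed', max_retries=5, timeout=10)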

View File

@ -73,6 +73,8 @@ class HostingConfiguration:
quota_limit=hosted_quota_limit,
restrict_models=[
RestrictModel(model="gpt-4", base_model_name="gpt-4", model_type=ModelType.LLM),
RestrictModel(model="gpt-4o", base_model_name="gpt-4o", model_type=ModelType.LLM),
RestrictModel(model="gpt-4o-mini", base_model_name="gpt-4o-mini", model_type=ModelType.LLM),
RestrictModel(model="gpt-4-32k", base_model_name="gpt-4-32k", model_type=ModelType.LLM),
RestrictModel(model="gpt-4-1106-preview", base_model_name="gpt-4-1106-preview", model_type=ModelType.LLM),
RestrictModel(model="gpt-4-vision-preview", base_model_name="gpt-4-vision-preview", model_type=ModelType.LLM),

View File

@ -12,6 +12,7 @@ from flask import Flask, current_app
from flask_login import current_user
from sqlalchemy.orm.exc import ObjectDeletedError
from configs import dify_config
from core.errors.error import ProviderTokenNotInitError
from core.llm_generator.llm_generator import LLMGenerator
from core.model_manager import ModelInstance, ModelManager
@ -224,7 +225,7 @@ class IndexingRunner:
features = FeatureService.get_features(tenant_id)
if features.billing.enabled:
count = len(extract_settings)
batch_upload_limit = int(current_app.config['BATCH_UPLOAD_LIMIT'])
batch_upload_limit = dify_config.BATCH_UPLOAD_LIMIT
if count > batch_upload_limit:
raise ValueError(f"You have reached the batch upload limit of {batch_upload_limit}.")
@ -427,7 +428,7 @@ class IndexingRunner:
# The user-defined segmentation rule
rules = json.loads(processing_rule.rules)
segmentation = rules["segmentation"]
max_segmentation_tokens_length = int(current_app.config['INDEXING_MAX_SEGMENTATION_TOKENS_LENGTH'])
max_segmentation_tokens_length = dify_config.INDEXING_MAX_SEGMENTATION_TOKENS_LENGTH
if segmentation["max_tokens"] < 50 or segmentation["max_tokens"] > max_segmentation_tokens_length:
raise ValueError(f"Custom segment length should be between 50 and {max_segmentation_tokens_length}.")

View File

@ -118,7 +118,7 @@ class LLMGenerator:
return questions
@classmethod
def generate_rule_config(cls, tenant_id: str, instruction: str, model_config: dict, no_variable: bool) -> dict:
def generate_rule_config(cls, tenant_id: str, instruction: str, model_config: dict, no_variable: bool, rule_config_max_tokens: int = 512) -> dict:
output_parser = RuleConfigGeneratorOutputParser()
error = ""
@ -130,7 +130,7 @@ class LLMGenerator:
"error": ""
}
model_parameters = {
"max_tokens": 512,
"max_tokens": rule_config_max_tokens,
"temperature": 0.01
}

View File

@ -86,6 +86,9 @@
- `agent-thought` Agent reasoning; generally models above 70B parameters have chain-of-thought capability.
- `vision` Vision, i.e., image understanding.
- `tool-call` Tool calling
- `multi-tool-call` Multiple tool calls
- `stream-tool-call` Streaming tool calls
### FetchFrom

View File

@ -87,6 +87,9 @@
- `agent-thought` Agent 推理,一般超过 70B 有思维链能力。
- `vision` 视觉,即:图像理解。
- `tool-call` 工具调用
- `multi-tool-call` 多工具调用
- `stream-tool-call` 流式工具调用
### FetchFrom

View File

@ -162,7 +162,7 @@ class AIModel(ABC):
# traverse all model_schema_yaml_paths
for model_schema_yaml_path in model_schema_yaml_paths:
# read yaml data from yaml file
yaml_data = load_yaml_file(model_schema_yaml_path, ignore_error=True)
yaml_data = load_yaml_file(model_schema_yaml_path)
new_parameter_rules = []
for parameter_rule in yaml_data.get('parameter_rules', []):

View File

@ -44,7 +44,7 @@ class ModelProvider(ABC):
# read provider schema from yaml file
yaml_path = os.path.join(current_path, f'{provider_name}.yaml')
yaml_data = load_yaml_file(yaml_path, ignore_error=True)
yaml_data = load_yaml_file(yaml_path)
try:
# yaml_data to entity

View File

@ -1,18 +1,16 @@
import hashlib
import logging
import re
import subprocess
import uuid
from abc import abstractmethod
from typing import Optional
from pydantic import ConfigDict
from core.model_runtime.entities.model_entities import ModelPropertyKey, ModelType
from core.model_runtime.errors.invoke import InvokeBadRequestError
from core.model_runtime.model_providers.__base.ai_model import AIModel
logger = logging.getLogger(__name__)
class TTSModel(AIModel):
"""
Model class for text-to-speech model.
@ -37,8 +35,6 @@ class TTSModel(AIModel):
:return: translated audio file
"""
try:
logger.info(f"Invoke TTS model: {model} , invoke content : {content_text}")
self._is_ffmpeg_installed()
return self._invoke(model=model, credentials=credentials, user=user,
content_text=content_text, voice=voice, tenant_id=tenant_id)
except Exception as e:
@ -75,7 +71,8 @@ class TTSModel(AIModel):
if model_schema and ModelPropertyKey.VOICES in model_schema.model_properties:
voices = model_schema.model_properties[ModelPropertyKey.VOICES]
if language:
return [{'name': d['name'], 'value': d['mode']} for d in voices if language and language in d.get('language')]
return [{'name': d['name'], 'value': d['mode']} for d in voices if
language and language in d.get('language')]
else:
return [{'name': d['name'], 'value': d['mode']} for d in voices]
@ -146,28 +143,3 @@ class TTSModel(AIModel):
if one_sentence != '':
result.append(one_sentence)
return result
@staticmethod
def _is_ffmpeg_installed():
try:
output = subprocess.check_output("ffmpeg -version", shell=True)
if "ffmpeg version" in output.decode("utf-8"):
return True
else:
raise InvokeBadRequestError("ffmpeg is not installed, "
"details: https://docs.dify.ai/getting-started/install-self-hosted"
"/install-faq#id-14.-what-to-do-if-this-error-occurs-in-text-to-speech")
except Exception:
raise InvokeBadRequestError("ffmpeg is not installed, "
"details: https://docs.dify.ai/getting-started/install-self-hosted"
"/install-faq#id-14.-what-to-do-if-this-error-occurs-in-text-to-speech")
# Todo: To improve the streaming function
@staticmethod
def _get_file_name(file_content: str) -> str:
hash_object = hashlib.sha256(file_content.encode())
hex_digest = hash_object.hexdigest()
namespace_uuid = uuid.UUID('a5da6ef9-b303-596f-8e88-bf8fa40f4b31')
unique_uuid = uuid.uuid5(namespace_uuid, hex_digest)
return str(unique_uuid)

View File

@ -6,6 +6,7 @@
- nvidia
- nvidia_nim
- cohere
- upstage
- bedrock
- togetherai
- openrouter

View File

@ -116,7 +116,8 @@ class AnthropicLargeLanguageModel(LargeLanguageModel):
# Add the new header for claude-3-5-sonnet-20240620 model
extra_headers = {}
if model == "claude-3-5-sonnet-20240620":
extra_headers["anthropic-beta"] = "max-tokens-3-5-sonnet-2024-07-15"
if model_parameters.get('max_tokens') > 4096:
extra_headers["anthropic-beta"] = "max-tokens-3-5-sonnet-2024-07-15"
if tools:
extra_model_kwargs['tools'] = [

View File

@ -496,6 +496,158 @@ LLM_BASE_MODELS = [
)
)
),
AzureBaseModel(
base_model_name='gpt-4o-mini',
entity=AIModelEntity(
model='fake-deployment-name',
label=I18nObject(
en_US='fake-deployment-name-label',
),
model_type=ModelType.LLM,
features=[
ModelFeature.AGENT_THOUGHT,
ModelFeature.VISION,
ModelFeature.MULTI_TOOL_CALL,
ModelFeature.STREAM_TOOL_CALL,
],
fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
model_properties={
ModelPropertyKey.MODE: LLMMode.CHAT.value,
ModelPropertyKey.CONTEXT_SIZE: 128000,
},
parameter_rules=[
ParameterRule(
name='temperature',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.TEMPERATURE],
),
ParameterRule(
name='top_p',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.TOP_P],
),
ParameterRule(
name='presence_penalty',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.PRESENCE_PENALTY],
),
ParameterRule(
name='frequency_penalty',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.FREQUENCY_PENALTY],
),
_get_max_tokens(default=512, min_val=1, max_val=16384),
ParameterRule(
name='seed',
label=I18nObject(
zh_Hans='种子',
en_US='Seed'
),
type='int',
help=I18nObject(
zh_Hans='如果指定,模型将尽最大努力进行确定性采样,使得重复的具有相同种子和参数的请求应该返回相同的结果。不能保证确定性,您应该参考 system_fingerprint 响应参数来监视变化。',
en_US='If specified, model will make a best effort to sample deterministically, such that repeated requests with the same seed and parameters should return the same result. Determinism is not guaranteed, and you should refer to the system_fingerprint response parameter to monitor changes in the backend.'
),
required=False,
precision=2,
min=0,
max=1,
),
ParameterRule(
name='response_format',
label=I18nObject(
zh_Hans='回复格式',
en_US='response_format'
),
type='string',
help=I18nObject(
zh_Hans='指定模型必须输出的格式',
en_US='specifying the format that the model must output'
),
required=False,
options=['text', 'json_object']
),
],
pricing=PriceConfig(
input=0.150,
output=0.600,
unit=0.000001,
currency='USD',
)
)
),
AzureBaseModel(
base_model_name='gpt-4o-mini-2024-07-18',
entity=AIModelEntity(
model='fake-deployment-name',
label=I18nObject(
en_US='fake-deployment-name-label',
),
model_type=ModelType.LLM,
features=[
ModelFeature.AGENT_THOUGHT,
ModelFeature.VISION,
ModelFeature.MULTI_TOOL_CALL,
ModelFeature.STREAM_TOOL_CALL,
],
fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
model_properties={
ModelPropertyKey.MODE: LLMMode.CHAT.value,
ModelPropertyKey.CONTEXT_SIZE: 128000,
},
parameter_rules=[
ParameterRule(
name='temperature',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.TEMPERATURE],
),
ParameterRule(
name='top_p',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.TOP_P],
),
ParameterRule(
name='presence_penalty',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.PRESENCE_PENALTY],
),
ParameterRule(
name='frequency_penalty',
**PARAMETER_RULE_TEMPLATE[DefaultParameterName.FREQUENCY_PENALTY],
),
_get_max_tokens(default=512, min_val=1, max_val=16384),
ParameterRule(
name='seed',
label=I18nObject(
zh_Hans='种子',
en_US='Seed'
),
type='int',
help=I18nObject(
zh_Hans='如果指定,模型将尽最大努力进行确定性采样,使得重复的具有相同种子和参数的请求应该返回相同的结果。不能保证确定性,您应该参考 system_fingerprint 响应参数来监视变化。',
en_US='If specified, model will make a best effort to sample deterministically, such that repeated requests with the same seed and parameters should return the same result. Determinism is not guaranteed, and you should refer to the system_fingerprint response parameter to monitor changes in the backend.'
),
required=False,
precision=2,
min=0,
max=1,
),
ParameterRule(
name='response_format',
label=I18nObject(
zh_Hans='回复格式',
en_US='response_format'
),
type='string',
help=I18nObject(
zh_Hans='指定模型必须输出的格式',
en_US='specifying the format that the model must output'
),
required=False,
options=['text', 'json_object']
),
],
pricing=PriceConfig(
input=0.150,
output=0.600,
unit=0.000001,
currency='USD',
)
)
),
AzureBaseModel(
base_model_name='gpt-4o',
entity=AIModelEntity(

View File

@ -114,6 +114,18 @@ model_credential_schema:
show_on:
- variable: __model_type
value: llm
- label:
en_US: gpt-4o-mini
value: gpt-4o-mini
show_on:
- variable: __model_type
value: llm
- label:
en_US: gpt-4o-mini-2024-07-18
value: gpt-4o-mini-2024-07-18
show_on:
- variable: __model_type
value: llm
- label:
en_US: gpt-4o
value: gpt-4o

View File

@ -375,6 +375,10 @@ class AzureOpenAILargeLanguageModel(_CommonAzureOpenAI, LargeLanguageModel):
continue
delta = chunk.choices[0]
# NOTE: For fix https://github.com/langgenius/dify/issues/5790
if delta.delta is None:
continue
# extract tool calls from response
self._update_tool_calls(tool_calls=tool_calls, tool_calls_response=delta.delta.tool_calls)

View File

@ -1,12 +1,8 @@
import concurrent.futures
import copy
from functools import reduce
from io import BytesIO
from typing import Optional
from flask import Response
from openai import AzureOpenAI
from pydub import AudioSegment
from core.model_runtime.entities.model_entities import AIModelEntity
from core.model_runtime.errors.invoke import InvokeBadRequestError
@ -51,7 +47,7 @@ class AzureOpenAIText2SpeechModel(_CommonAzureOpenAI, TTSModel):
:return: text translated to audio file
"""
try:
self._tts_invoke(
self._tts_invoke_streaming(
model=model,
credentials=credentials,
content_text='Hello Dify!',
@ -60,45 +56,6 @@ class AzureOpenAIText2SpeechModel(_CommonAzureOpenAI, TTSModel):
except Exception as ex:
raise CredentialsValidateFailedError(str(ex))
def _tts_invoke(self, model: str, credentials: dict, content_text: str, voice: str) -> Response:
"""
_tts_invoke text2speech model
:param model: model name
:param credentials: model credentials
:param content_text: text content to be translated
:param voice: model timbre
:return: text translated to audio file
"""
audio_type = self._get_model_audio_type(model, credentials)
word_limit = self._get_model_word_limit(model, credentials)
max_workers = self._get_model_workers_limit(model, credentials)
try:
sentences = list(self._split_text_into_sentences(org_text=content_text, max_length=word_limit))
audio_bytes_list = []
# Create a thread pool and map the function to the list of sentences
with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
futures = [executor.submit(self._process_sentence, sentence=sentence, model=model, voice=voice,
credentials=credentials) for sentence in sentences]
for future in futures:
try:
if future.result():
audio_bytes_list.append(future.result())
except Exception as ex:
raise InvokeBadRequestError(str(ex))
if len(audio_bytes_list) > 0:
audio_segments = [AudioSegment.from_file(BytesIO(audio_bytes), format=audio_type) for audio_bytes in
audio_bytes_list if audio_bytes]
combined_segment = reduce(lambda x, y: x + y, audio_segments)
buffer: BytesIO = BytesIO()
combined_segment.export(buffer, format=audio_type)
buffer.seek(0)
return Response(buffer.read(), status=200, mimetype=f"audio/{audio_type}")
except Exception as ex:
raise InvokeBadRequestError(str(ex))
def _tts_invoke_streaming(self, model: str, credentials: dict, content_text: str,
voice: str) -> any:
"""
@ -144,7 +101,6 @@ class AzureOpenAIText2SpeechModel(_CommonAzureOpenAI, TTSModel):
:param sentence: text content to be translated
:return: text translated to audio file
"""
# transform credentials to kwargs for model instance
credentials_kwargs = self._to_credential_kwargs(credentials)
client = AzureOpenAI(**credentials_kwargs)
response = client.audio.speech.create(model=model, voice=voice, input=sentence.strip())

View File

@ -10,10 +10,14 @@
- cohere.command-text-v14
- cohere.command-r-plus-v1.0
- cohere.command-r-v1.0
- meta.llama3-1-8b-instruct-v1:0
- meta.llama3-1-70b-instruct-v1:0
- meta.llama3-1-405b-instruct-v1:0
- meta.llama3-8b-instruct-v1:0
- meta.llama3-70b-instruct-v1:0
- meta.llama2-13b-chat-v1
- meta.llama2-70b-chat-v1
- mistral.mistral-large-2407-v1:0
- mistral.mistral-small-2402-v1:0
- mistral.mistral-large-2402-v1:0
- mistral.mixtral-8x7b-instruct-v0:1

View File

@ -3,8 +3,7 @@ label:
en_US: Command R+
model_type: llm
features:
#- multi-tool-call
- agent-thought
- tool-call
#- stream-tool-call
model_properties:
mode: chat

View File

@ -3,9 +3,7 @@ label:
en_US: Command R
model_type: llm
features:
#- multi-tool-call
- agent-thought
#- stream-tool-call
- tool-call
model_properties:
mode: chat
context_size: 128000

View File

@ -17,7 +17,6 @@ from botocore.exceptions import (
ServiceNotInRegionError,
UnknownServiceError,
)
from cohere import ChatMessage
# local import
from core.model_runtime.entities.llm_entities import LLMResult, LLMResultChunk, LLMResultChunkDelta
@ -42,7 +41,6 @@ from core.model_runtime.errors.invoke import (
)
from core.model_runtime.errors.validate import CredentialsValidateFailedError
from core.model_runtime.model_providers.__base.large_language_model import LargeLanguageModel
from core.model_runtime.model_providers.cohere.llm.llm import CohereLargeLanguageModel
logger = logging.getLogger(__name__)
@ -59,6 +57,7 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
{'prefix': 'mistral.mixtral-8x7b-instruct', 'support_system_prompts': False, 'support_tool_use': False},
{'prefix': 'mistral.mistral-large', 'support_system_prompts': True, 'support_tool_use': True},
{'prefix': 'mistral.mistral-small', 'support_system_prompts': True, 'support_tool_use': True},
{'prefix': 'cohere.command-r', 'support_system_prompts': True, 'support_tool_use': True},
{'prefix': 'amazon.titan', 'support_system_prompts': False, 'support_tool_use': False}
]
@ -94,86 +93,8 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
model_info['model'] = model
# invoke models via boto3 converse API
return self._generate_with_converse(model_info, credentials, prompt_messages, model_parameters, stop, stream, user, tools)
# invoke Cohere models via boto3 client
if "cohere.command-r" in model:
return self._generate_cohere_chat(model, credentials, prompt_messages, model_parameters, stop, stream, user, tools)
# invoke other models via boto3 client
return self._generate(model, credentials, prompt_messages, model_parameters, stop, stream, user)
def _generate_cohere_chat(
self, model: str, credentials: dict, prompt_messages: list[PromptMessage], model_parameters: dict,
stop: Optional[list[str]] = None, stream: bool = True, user: Optional[str] = None,
tools: Optional[list[PromptMessageTool]] = None,) -> Union[LLMResult, Generator]:
cohere_llm = CohereLargeLanguageModel()
client_config = Config(
region_name=credentials["aws_region"]
)
runtime_client = boto3.client(
service_name='bedrock-runtime',
config=client_config,
aws_access_key_id=credentials["aws_access_key_id"],
aws_secret_access_key=credentials["aws_secret_access_key"]
)
extra_model_kwargs = {}
if stop:
extra_model_kwargs['stop_sequences'] = stop
if tools:
tools = cohere_llm._convert_tools(tools)
model_parameters['tools'] = tools
message, chat_histories, tool_results \
= cohere_llm._convert_prompt_messages_to_message_and_chat_histories(prompt_messages)
if tool_results:
model_parameters['tool_results'] = tool_results
payload = {
**model_parameters,
"message": message,
"chat_history": chat_histories,
}
# need workaround for ai21 models which doesn't support streaming
if stream:
invoke = runtime_client.invoke_model_with_response_stream
else:
invoke = runtime_client.invoke_model
def serialize(obj):
if isinstance(obj, ChatMessage):
return obj.__dict__
raise TypeError(f"Type {type(obj)} not serializable")
try:
body_jsonstr=json.dumps(payload, default=serialize)
response = invoke(
modelId=model,
contentType="application/json",
accept="*/*",
body=body_jsonstr
)
except ClientError as ex:
error_code = ex.response['Error']['Code']
full_error_msg = f"{error_code}: {ex.response['Error']['Message']}"
raise self._map_client_to_invoke_error(error_code, full_error_msg)
except (EndpointConnectionError, NoRegionError, ServiceNotInRegionError) as ex:
raise InvokeConnectionError(str(ex))
except UnknownServiceError as ex:
raise InvokeServerUnavailableError(str(ex))
except Exception as ex:
raise InvokeError(str(ex))
if stream:
return self._handle_generate_stream_response(model, credentials, response, prompt_messages)
return self._handle_generate_response(model, credentials, response, prompt_messages)
def _generate_with_converse(self, model_info: dict, credentials: dict, prompt_messages: list[PromptMessage], model_parameters: dict,
stop: Optional[list[str]] = None, stream: bool = True, user: Optional[str] = None, tools: Optional[list[PromptMessageTool]] = None,) -> Union[LLMResult, Generator]:
@ -208,14 +129,25 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
if model_info['support_tool_use'] and tools:
parameters['toolConfig'] = self._convert_converse_tool_config(tools=tools)
try:
if stream:
response = bedrock_client.converse_stream(**parameters)
return self._handle_converse_stream_response(model_info['model'], credentials, response, prompt_messages)
else:
response = bedrock_client.converse(**parameters)
return self._handle_converse_response(model_info['model'], credentials, response, prompt_messages)
except ClientError as ex:
error_code = ex.response['Error']['Code']
full_error_msg = f"{error_code}: {ex.response['Error']['Message']}"
raise self._map_client_to_invoke_error(error_code, full_error_msg)
except (EndpointConnectionError, NoRegionError, ServiceNotInRegionError) as ex:
raise InvokeConnectionError(str(ex))
if stream:
response = bedrock_client.converse_stream(**parameters)
return self._handle_converse_stream_response(model_info['model'], credentials, response, prompt_messages)
else:
response = bedrock_client.converse(**parameters)
return self._handle_converse_response(model_info['model'], credentials, response, prompt_messages)
except UnknownServiceError as ex:
raise InvokeServerUnavailableError(str(ex))
except Exception as ex:
raise InvokeError(str(ex))
def _handle_converse_response(self, model: str, credentials: dict, response: dict,
prompt_messages: list[PromptMessage]) -> LLMResult:
"""
@ -558,7 +490,6 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
except ClientError as ex:
error_code = ex.response['Error']['Code']
full_error_msg = f"{error_code}: {ex.response['Error']['Message']}"
raise CredentialsValidateFailedError(str(self._map_client_to_invoke_error(error_code, full_error_msg)))
except Exception as ex:
@ -571,38 +502,9 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
:param message: PromptMessage to convert.
:return: String representation of the message.
"""
if model_prefix == "anthropic":
human_prompt_prefix = "\n\nHuman:"
human_prompt_postfix = ""
ai_prompt = "\n\nAssistant:"
elif model_prefix == "meta":
# LLAMA3
if model_name.startswith("llama3"):
human_prompt_prefix = "<|eot_id|><|start_header_id|>user<|end_header_id|>\n\n"
human_prompt_postfix = "<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n"
ai_prompt = "\n\nAssistant:"
else:
# LLAMA2
human_prompt_prefix = "\n[INST]"
human_prompt_postfix = "[\\INST]\n"
ai_prompt = ""
elif model_prefix == "mistral":
human_prompt_prefix = "<s>[INST]"
human_prompt_postfix = "[\\INST]\n"
ai_prompt = "\n\nAssistant:"
elif model_prefix == "amazon":
human_prompt_prefix = "\n\nUser:"
human_prompt_postfix = ""
ai_prompt = "\n\nBot:"
else:
human_prompt_prefix = ""
human_prompt_postfix = ""
ai_prompt = ""
human_prompt_prefix = ""
human_prompt_postfix = ""
ai_prompt = ""
content = message.content
@ -653,13 +555,7 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
model_prefix = model.split('.')[0]
model_name = model.split('.')[1]
if model_prefix == "amazon":
payload["textGenerationConfig"] = { **model_parameters }
payload["textGenerationConfig"]["stopSequences"] = ["User:"]
payload["inputText"] = self._convert_messages_to_prompt(prompt_messages, model_prefix)
elif model_prefix == "ai21":
if model_prefix == "ai21":
payload["temperature"] = model_parameters.get("temperature")
payload["topP"] = model_parameters.get("topP")
payload["maxTokens"] = model_parameters.get("maxTokens")
@ -671,28 +567,12 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
payload["frequencyPenalty"] = {model_parameters.get("frequencyPenalty")}
if model_parameters.get("countPenalty"):
payload["countPenalty"] = {model_parameters.get("countPenalty")}
elif model_prefix == "mistral":
payload["temperature"] = model_parameters.get("temperature")
payload["top_p"] = model_parameters.get("top_p")
payload["max_tokens"] = model_parameters.get("max_tokens")
payload["prompt"] = self._convert_messages_to_prompt(prompt_messages, model_prefix)
payload["stop"] = stop[:10] if stop else []
elif model_prefix == "anthropic":
payload = { **model_parameters }
payload["prompt"] = self._convert_messages_to_prompt(prompt_messages, model_prefix)
payload["stop_sequences"] = ["\n\nHuman:"] + (stop if stop else [])
elif model_prefix == "cohere":
payload = { **model_parameters }
payload["prompt"] = prompt_messages[0].content
payload["stream"] = stream
elif model_prefix == "meta":
payload = { **model_parameters }
payload["prompt"] = self._convert_messages_to_prompt(prompt_messages, model_prefix, model_name)
else:
raise ValueError(f"Got unknown model prefix {model_prefix}")
@ -783,36 +663,16 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
# get output text and calculate num tokens based on model / provider
model_prefix = model.split('.')[0]
if model_prefix == "amazon":
output = response_body.get("results")[0].get("outputText").strip('\n')
prompt_tokens = response_body.get("inputTextTokenCount")
completion_tokens = response_body.get("results")[0].get("tokenCount")
elif model_prefix == "ai21":
if model_prefix == "ai21":
output = response_body.get('completions')[0].get('data').get('text')
prompt_tokens = len(response_body.get("prompt").get("tokens"))
completion_tokens = len(response_body.get('completions')[0].get('data').get('tokens'))
elif model_prefix == "anthropic":
output = response_body.get("completion")
prompt_tokens = self.get_num_tokens(model, credentials, prompt_messages)
completion_tokens = self.get_num_tokens(model, credentials, output if output else '')
elif model_prefix == "cohere":
output = response_body.get("generations")[0].get("text")
prompt_tokens = self.get_num_tokens(model, credentials, prompt_messages)
completion_tokens = self.get_num_tokens(model, credentials, output if output else '')
elif model_prefix == "meta":
output = response_body.get("generation").strip('\n')
prompt_tokens = response_body.get("prompt_token_count")
completion_tokens = response_body.get("generation_token_count")
elif model_prefix == "mistral":
output = response_body.get("outputs")[0].get("text")
prompt_tokens = response.get('ResponseMetadata').get('HTTPHeaders').get('x-amzn-bedrock-input-token-count')
completion_tokens = response.get('ResponseMetadata').get('HTTPHeaders').get('x-amzn-bedrock-output-token-count')
else:
raise ValueError(f"Got unknown model prefix {model_prefix} when handling block response")
@ -883,26 +743,10 @@ class BedrockLargeLanguageModel(LargeLanguageModel):
payload = json.loads(chunk.get('bytes').decode())
model_prefix = model.split('.')[0]
if model_prefix == "amazon":
content_delta = payload.get("outputText").strip('\n')
finish_reason = payload.get("completion_reason")
elif model_prefix == "anthropic":
content_delta = payload.get("completion")
finish_reason = payload.get("stop_reason")
elif model_prefix == "cohere":
if model_prefix == "cohere":
content_delta = payload.get("text")
finish_reason = payload.get("finish_reason")
elif model_prefix == "mistral":
content_delta = payload.get('outputs')[0].get("text")
finish_reason = payload.get('outputs')[0].get("stop_reason")
elif model_prefix == "meta":
content_delta = payload.get("generation").strip('\n')
finish_reason = payload.get("stop_reason")
else:
raise ValueError(f"Got unknown model prefix {model_prefix} when handling stream response")

View File

@@ -0,0 +1,25 @@
model: meta.llama3-1-405b-instruct-v1:0
label:
en_US: Llama 3.1 405B Instruct
model_type: llm
model_properties:
mode: completion
context_size: 128000
parameter_rules:
- name: temperature
use_template: temperature
default: 0.5
- name: top_p
use_template: top_p
default: 0.9
- name: max_gen_len
use_template: max_tokens
required: true
default: 512
min: 1
max: 2048
pricing:
input: '0.00532'
output: '0.016'
unit: '0.001'
currency: USD

View File

@@ -0,0 +1,25 @@
model: meta.llama3-1-70b-instruct-v1:0
label:
en_US: Llama 3.1 70B Instruct
model_type: llm
model_properties:
mode: completion
context_size: 128000
parameter_rules:
- name: temperature
use_template: temperature
default: 0.5
- name: top_p
use_template: top_p
default: 0.9
- name: max_gen_len
use_template: max_tokens
required: true
default: 512
min: 1
max: 2048
pricing:
input: '0.00265'
output: '0.0035'
unit: '0.001'
currency: USD

View File

@@ -0,0 +1,25 @@
model: meta.llama3-1-8b-instruct-v1:0
label:
en_US: Llama 3.1 8B Instruct
model_type: llm
model_properties:
mode: completion
context_size: 128000
parameter_rules:
- name: temperature
use_template: temperature
default: 0.5
- name: top_p
use_template: top_p
default: 0.9
- name: max_gen_len
use_template: max_tokens
required: true
default: 512
min: 1
max: 2048
pricing:
input: '0.0003'
output: '0.0006'
unit: '0.001'
currency: USD
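All three Llama 3.1 configs above expose max_gen_len through the max_tokens template; per the meta branch shown earlier, these parameters pass through to the Bedrock request body unchanged. A sketch of the resulting body using the YAML defaults (the prompt string is a placeholder):

import json

# Defaults taken from the YAML above; the meta branch copies
# model_parameters into the payload as-is and adds the converted prompt.
model_parameters = {"temperature": 0.5, "top_p": 0.9, "max_gen_len": 512}
payload = {**model_parameters, "prompt": "Hello"}  # placeholder prompt
body = json.dumps(payload)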

View File

@@ -0,0 +1,29 @@
model: mistral.mistral-large-2407-v1:0
label:
en_US: Mistral Large 2 (24.07)
model_type: llm
features:
- tool-call
model_properties:
mode: completion
context_size: 128000
parameter_rules:
- name: temperature
use_template: temperature
required: false
default: 0.7
- name: top_p
use_template: top_p
required: false
default: 1
- name: max_tokens
use_template: max_tokens
required: true
default: 512
min: 1
max: 8192
pricing:
input: '0.003'
output: '0.009'
unit: '0.001'
currency: USD

View File

@@ -5,6 +5,8 @@ label:
model_type: llm
features:
- agent-thought
- multi-tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 128000
@@ -23,7 +25,7 @@ parameter_rules:
type: int
default: 4096
min: 1
max: 4096
max: 8192
help:
zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
@@ -57,6 +59,18 @@ parameter_rules:
help:
zh_Hans: 介于 -2.0 和 2.0 之间的数字。如果该值为正,那么新 token 会根据其在已有文本中的出现频率受到相应的惩罚,降低模型重复相同内容的可能性。
en_US: A number between -2.0 and 2.0. If the value is positive, new tokens are penalized based on their frequency of occurrence in existing text, reducing the likelihood that the model will repeat the same content.
- name: response_format
label:
zh_Hans: 回复格式
en_US: response_format
type: string
help:
zh_Hans: 指定模型必须输出的格式
en_US: Specify the format that the model must output
required: false
options:
- text
- json_object
pricing:
input: '1'
output: '2'
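The new response_format rule exposes text and json_object options. As a minimal sketch, assuming this provider is consumed through an OpenAI-compatible chat completions client (base_url, api_key, and model name are placeholders):

from openai import OpenAI  # assumed client; any OpenAI-compatible SDK works

client = OpenAI(base_url="https://example.com/v1", api_key="sk-placeholder")
completion = client.chat.completions.create(
    model="placeholder-128k-chat-model",
    messages=[{"role": "user", "content": "Reply with a JSON object."}],
    response_format={"type": "json_object"},  # or {"type": "text"}
)
print(completion.choices[0].message.content)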

View File

@@ -5,6 +5,8 @@ label:
model_type: llm
features:
- agent-thought
- multi-tool-call
- stream-tool-call
model_properties:
mode: chat
context_size: 128000

View File

@@ -0,0 +1,7 @@
- llama-3.1-405b-reasoning
- llama-3.1-70b-versatile
- llama-3.1-8b-instant
- llama3-70b-8192
- llama3-8b-8192
- mixtral-8x7b-32768
- llama2-70b-4096

View File

@@ -0,0 +1,25 @@
model: llama-3.1-405b-reasoning
label:
zh_Hans: Llama-3.1-405b-reasoning
en_US: Llama-3.1-405b-reasoning
model_type: llm
features:
- agent-thought
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature
- name: top_p
use_template: top_p
- name: max_tokens
use_template: max_tokens
default: 512
min: 1
max: 8192
pricing:
input: '0.05'
output: '0.1'
unit: '0.000001'
currency: USD

View File

@@ -0,0 +1,25 @@
model: llama-3.1-70b-versatile
label:
zh_Hans: Llama-3.1-70b-versatile
en_US: Llama-3.1-70b-versatile
model_type: llm
features:
- agent-thought
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature
- name: top_p
use_template: top_p
- name: max_tokens
use_template: max_tokens
default: 512
min: 1
max: 8192
pricing:
input: '0.05'
output: '0.1'
unit: '0.000001'
currency: USD

View File

@@ -0,0 +1,25 @@
model: llama-3.1-8b-instant
label:
zh_Hans: Llama-3.1-8b-instant
en_US: Llama-3.1-8b-instant
model_type: llm
features:
- agent-thought
model_properties:
mode: chat
context_size: 131072
parameter_rules:
- name: temperature
use_template: temperature
- name: top_p
use_template: top_p
- name: max_tokens
use_template: max_tokens
default: 512
min: 1
max: 8192
pricing:
input: '0.05'
output: '0.1'
unit: '0.000001'
currency: USD

View File

@@ -19,7 +19,7 @@ parameter_rules:
min: 1
max: 8192
pricing:
input: '0.05'
output: '0.1'
input: '0.59'
output: '0.79'
unit: '0.000001'
currency: USD

View File

@@ -19,7 +19,7 @@ parameter_rules:
min: 1
max: 8192
pricing:
input: '0.59'
output: '0.79'
input: '0.05'
output: '0.08'
unit: '0.000001'
currency: USD

View File

@@ -18,6 +18,7 @@ help:
en_US: https://console.cloud.tencent.com/cam/capi
supported_model_types:
- llm
- text-embedding
configurate_methods:
- predefined-model
provider_credential_schema:

View File

@@ -21,6 +21,16 @@ parameter_rules:
default: 1024
min: 1
max: 32000
- name: enable_enhance
label:
zh_Hans: 功能增强
en_US: Enable Enhancement
type: boolean
help:
zh_Hans: 功能增强(如搜索)开关,关闭时将直接由主模型生成回复内容,可以降低响应时延(对于流式输出时的首字时延尤为明显)。但在少数场景里,回复效果可能会下降。
en_US: Toggle for enhancements such as search. When disabled, the main model generates the reply directly, which lowers response latency (especially first-token latency when streaming), though reply quality may drop in a few scenarios.
required: false
default: true
pricing:
input: '0.03'
output: '0.10'

View File

@@ -21,6 +21,16 @@ parameter_rules:
default: 1024
min: 1
max: 256000
- name: enable_enhance
label:
zh_Hans: 功能增强
en_US: Enable Enhancement
type: boolean
help:
zh_Hans: 功能增强(如搜索)开关,关闭时将直接由主模型生成回复内容,可以降低响应时延(对于流式输出时的首字时延尤为明显)。但在少数场景里,回复效果可能会下降。
en_US: Toggle for enhancements such as search. When disabled, the main model generates the reply directly, which lowers response latency (especially first-token latency when streaming), though reply quality may drop in a few scenarios.
required: false
default: true
pricing:
input: '0.015'
output: '0.06'

View File

@@ -21,6 +21,16 @@ parameter_rules:
default: 1024
min: 1
max: 32000
- name: enable_enhance
label:
zh_Hans: 功能增强
en_US: Enable Enhancement
type: boolean
help:
zh_Hans: 功能增强(如搜索)开关,关闭时将直接由主模型生成回复内容,可以降低响应时延(对于流式输出时的首字时延尤为明显)。但在少数场景里,回复效果可能会下降。
en_US: Toggle for enhancements such as search. When disabled, the main model generates the reply directly, which lowers response latency (especially first-token latency when streaming), though reply quality may drop in a few scenarios.
required: false
default: true
pricing:
input: '0.0045'
output: '0.0005'
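Each of these hunyuan configs gains the same enable_enhance switch; as the model-runtime code further below shows, it maps to the EnableEnhancement field of the ChatCompletions request. A minimal sketch of that mapping (parameter values are placeholders):

# enable_enhance from the YAML maps to EnableEnhancement in the request;
# the values below are placeholders.
model_parameters = {"temperature": 0.5, "top_p": 1.0, "enable_enhance": False}
custom_parameters = {
    "Temperature": model_parameters.get("temperature", 0.0),
    "TopP": model_parameters.get("top_p", 1.0),
    "EnableEnhancement": model_parameters.get("enable_enhance", True),
}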

View File

@@ -14,6 +14,7 @@ from core.model_runtime.entities.message_entities import (
PromptMessage,
PromptMessageTool,
SystemPromptMessage,
ToolPromptMessage,
UserPromptMessage,
)
from core.model_runtime.errors.invoke import InvokeError
@@ -35,7 +36,8 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
custom_parameters = {
'Temperature': model_parameters.get('temperature', 0.0),
'TopP': model_parameters.get('top_p', 1.0)
'TopP': model_parameters.get('top_p', 1.0),
'EnableEnhancement': model_parameters.get('enable_enhance', True)
}
params = {
@@ -44,6 +46,17 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
"Stream": stream,
**custom_parameters,
}
# add Tools and ToolChoice
if (tools and len(tools) > 0):
params['ToolChoice'] = "auto"
params['Tools'] = [{
"Type": "function",
"Function": {
"Name": tool.name,
"Description": tool.description,
"Parameters": json.dumps(tool.parameters)
}
} for tool in tools]
request.from_json_string(json.dumps(params))
response = client.ChatCompletions(request)
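Based on the hunk above, Hunyuan expects function tools in a Type/Function envelope with the JSON schema serialized into a string. A sketch of the resulting params for one hypothetical tool:

import json

# Hypothetical tool definition; the envelope mirrors the code above.
weather_tool = {
    "name": "get_weather",
    "description": "Look up the current weather for a city",
    "parameters": {"type": "object",
                   "properties": {"city": {"type": "string"}}},
}
params = {
    "ToolChoice": "auto",
    "Tools": [{
        "Type": "function",
        "Function": {
            "Name": weather_tool["name"],
            "Description": weather_tool["description"],
            "Parameters": json.dumps(weather_tool["parameters"]),  # string, not object
        },
    }],
}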
@@ -89,9 +102,43 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
def _convert_prompt_messages_to_dicts(self, prompt_messages: list[PromptMessage]) -> list[dict]:
"""Convert a list of PromptMessage objects to a list of dictionaries with 'Role' and 'Content' keys."""
return [{"Role": message.role.value, "Content": message.content} for message in prompt_messages]
dict_list = []
for message in prompt_messages:
if isinstance(message, AssistantPromptMessage):
tool_calls = message.tool_calls
if (tool_calls and len(tool_calls) > 0):
dict_tool_calls = [
{
"Id": tool_call.id,
"Type": tool_call.type,
"Function": {
"Name": tool_call.function.name,
"Arguments": tool_call.function.arguments if (tool_call.function.arguments == "") else "{}"
}
} for tool_call in tool_calls]
dict_list.append({
"Role": message.role.value,
# use a single space as content for tool_call requests; an empty string
# triggers [hunyuan] TencentCloudSDKException code:InvalidParameter message:Messages Content and Contents not allowed empty at the same time.
"Content": " ", # message.content if (message.content is not None) else ""
"ToolCalls": dict_tool_calls
})
else:
dict_list.append({ "Role": message.role.value, "Content": message.content })
elif isinstance(message, ToolPromptMessage):
tool_execute_result = { "result": message.content }
content = json.dumps(tool_execute_result, ensure_ascii=False)
dict_list.append({ "Role": message.role.value, "Content": content, "ToolCallId": message.tool_call_id })
else:
dict_list.append({ "Role": message.role.value, "Content": message.content })
return dict_list
def _handle_stream_chat_response(self, model, credentials, prompt_messages, resp):
tool_call = None
tool_calls = []
for index, event in enumerate(resp):
logging.debug("_handle_stream_chat_response, event: %s", event)
@@ -109,20 +156,54 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
usage = data.get('Usage', {})
prompt_tokens = usage.get('PromptTokens', 0)
completion_tokens = usage.get('CompletionTokens', 0)
usage = self._calc_response_usage(model, credentials, prompt_tokens, completion_tokens)
response_tool_calls = delta.get('ToolCalls')
if (response_tool_calls is not None):
new_tool_calls = self._extract_response_tool_calls(response_tool_calls)
if (len(new_tool_calls) > 0):
new_tool_call = new_tool_calls[0]
if (tool_call is None): tool_call = new_tool_call
elif (tool_call.id != new_tool_call.id):
tool_calls.append(tool_call)
tool_call = new_tool_call
else:
tool_call.function.name += new_tool_call.function.name
tool_call.function.arguments += new_tool_call.function.arguments
if (tool_call is not None and len(tool_call.function.name) > 0 and len(tool_call.function.arguments) > 0):
tool_calls.append(tool_call)
tool_call = None
assistant_prompt_message = AssistantPromptMessage(
content=message_content,
tool_calls=[]
)
# clear content when tool_calls are present so no text is shown on the web page
if (len(tool_calls) > 0): assistant_prompt_message.content = ""
# add tool_calls to assistant_prompt_message
if (finish_reason == 'tool_calls'):
assistant_prompt_message.tool_calls = tool_calls
tool_call = None
tool_calls = []
delta_chunk = LLMResultChunkDelta(
index=index,
role=delta.get('Role', 'assistant'),
message=assistant_prompt_message,
usage=usage,
finish_reason=finish_reason,
)
if (len(finish_reason) > 0):
usage = self._calc_response_usage(model, credentials, prompt_tokens, completion_tokens)
delta_chunk = LLMResultChunkDelta(
index=index,
role=delta.get('Role', 'assistant'),
message=assistant_prompt_message,
usage=usage,
finish_reason=finish_reason,
)
tool_call = None
tool_calls = []
else:
delta_chunk = LLMResultChunkDelta(
index=index,
message=assistant_prompt_message,
)
yield LLMResultChunk(
model=model,
@@ -177,12 +258,15 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
"""
human_prompt = "\n\nHuman:"
ai_prompt = "\n\nAssistant:"
tool_prompt = "\n\nTool:"
content = message.content
if isinstance(message, UserPromptMessage):
message_text = f"{human_prompt} {content}"
elif isinstance(message, AssistantPromptMessage):
message_text = f"{ai_prompt} {content}"
elif isinstance(message, ToolPromptMessage):
message_text = f"{tool_prompt} {content}"
elif isinstance(message, SystemPromptMessage):
message_text = content
else:
@@ -203,3 +287,30 @@ class HunyuanLargeLanguageModel(LargeLanguageModel):
return {
InvokeError: [TencentCloudSDKException],
}
def _extract_response_tool_calls(self,
response_tool_calls: list[dict]) \
-> list[AssistantPromptMessage.ToolCall]:
"""
Extract tool calls from response
:param response_tool_calls: response tool calls
:return: list of tool calls
"""
tool_calls = []
if response_tool_calls:
for response_tool_call in response_tool_calls:
response_function = response_tool_call.get('Function', {})
function = AssistantPromptMessage.ToolCall.ToolCallFunction(
name=response_function.get('Name', ''),
arguments=response_function.get('Arguments', '')
)
tool_call = AssistantPromptMessage.ToolCall(
id=response_tool_call.get('Id', 0),
type='function',
function=function
)
tool_calls.append(tool_call)
return tool_calls
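To illustrate both helpers in this file: _convert_prompt_messages_to_dicts serializes an assistant tool call and its tool result roughly as below, and _extract_response_tool_calls reverses the Function envelope back into ToolCall objects (ids, names, and arguments here are made up):

# Hypothetical serialized messages, as produced by
# _convert_prompt_messages_to_dicts for a tool-call round trip.
messages = [
    {"Role": "user", "Content": "What's the weather in Shenzhen?"},
    {
        "Role": "assistant",
        "Content": " ",  # single space; empty content is rejected by the API
        "ToolCalls": [{
            "Id": "call_0",
            "Type": "function",
            "Function": {"Name": "get_weather",
                         "Arguments": "{\"city\": \"Shenzhen\"}"},
        }],
    },
    {"Role": "tool", "Content": "{\"result\": \"22°C, cloudy\"}",
     "ToolCallId": "call_0"},
]

# Feeding the assistant message's ToolCalls back through
# _extract_response_tool_calls would yield one ToolCall whose function
# is named get_weather with the same JSON-string arguments.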

View File

@@ -0,0 +1,5 @@
model: hunyuan-embedding
model_type: text-embedding
model_properties:
context_size: 1024
max_chunks: 1

View File

@@ -0,0 +1,173 @@
import json
import logging
import time
from typing import Optional
from tencentcloud.common import credential
from tencentcloud.common.exception import TencentCloudSDKException
from tencentcloud.common.profile.client_profile import ClientProfile
from tencentcloud.common.profile.http_profile import HttpProfile
from tencentcloud.hunyuan.v20230901 import hunyuan_client, models
from core.model_runtime.entities.model_entities import PriceType
from core.model_runtime.entities.text_embedding_entities import EmbeddingUsage, TextEmbeddingResult
from core.model_runtime.errors.invoke import (
InvokeError,
)
from core.model_runtime.errors.validate import CredentialsValidateFailedError
from core.model_runtime.model_providers.__base.text_embedding_model import TextEmbeddingModel
logger = logging.getLogger(__name__)
class HunyuanTextEmbeddingModel(TextEmbeddingModel):
"""
Model class for Hunyuan text embedding model.
"""
def _invoke(self, model: str, credentials: dict,
texts: list[str], user: Optional[str] = None) \
-> TextEmbeddingResult:
"""
Invoke text embedding model
:param model: model name
:param credentials: model credentials
:param texts: texts to embed
:param user: unique user id
:return: embeddings result
"""
if model != 'hunyuan-embedding':
raise ValueError('Invalid model name')
client = self._setup_hunyuan_client(credentials)
embeddings = []
token_usage = 0
for text in texts:
request = models.GetEmbeddingRequest()
params = {
"Input": text
}
request.from_json_string(json.dumps(params))
response = client.GetEmbedding(request)
usage = response.Usage.TotalTokens
embeddings.extend([data.Embedding for data in response.Data])
token_usage += usage
result = TextEmbeddingResult(
model=model,
embeddings=embeddings,
usage=self._calc_response_usage(
model=model,
credentials=credentials,
tokens=token_usage
)
)
return result
def validate_credentials(self, model: str, credentials: dict) -> None:
"""
Validate credentials
"""
try:
client = self._setup_hunyuan_client(credentials)
req = models.ChatCompletionsRequest()
params = {
"Model": model,
"Messages": [{
"Role": "user",
"Content": "hello"
}],
"TopP": 1,
"Temperature": 0,
"Stream": False
}
req.from_json_string(json.dumps(params))
client.ChatCompletions(req)
except Exception as e:
raise CredentialsValidateFailedError(f'Credentials validation failed: {e}')
def _setup_hunyuan_client(self, credentials):
secret_id = credentials['secret_id']
secret_key = credentials['secret_key']
cred = credential.Credential(secret_id, secret_key)
httpProfile = HttpProfile()
httpProfile.endpoint = "hunyuan.tencentcloudapi.com"
clientProfile = ClientProfile()
clientProfile.httpProfile = httpProfile
client = hunyuan_client.HunyuanClient(cred, "", clientProfile)
return client
def _calc_response_usage(self, model: str, credentials: dict, tokens: int) -> EmbeddingUsage:
"""
Calculate response usage
:param model: model name
:param credentials: model credentials
:param tokens: input tokens
:return: usage
"""
# get input price info
input_price_info = self.get_price(
model=model,
credentials=credentials,
price_type=PriceType.INPUT,
tokens=tokens
)
# transform usage
usage = EmbeddingUsage(
tokens=tokens,
total_tokens=tokens,
unit_price=input_price_info.unit_price,
price_unit=input_price_info.unit,
total_price=input_price_info.total_amount,
currency=input_price_info.currency,
latency=time.perf_counter() - self.started_at
)
return usage
@property
def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
"""
Map model invoke error to unified error
The key is the error type thrown to the caller
The value is the error type thrown by the model,
which needs to be converted into a unified error type for the caller.
:return: Invoke error mapping
"""
return {
InvokeError: [TencentCloudSDKException],
}
def get_num_tokens(self, model: str, credentials: dict, texts: list[str]) -> int:
"""
Get number of tokens for given prompt messages
:param model: model name
:param credentials: model credentials
:param texts: texts to embed
:return:
"""
# client = self._setup_hunyuan_client(credentials)
num_tokens = 0
for text in texts:
num_tokens += self._get_num_tokens_by_gpt2(text)
# use client.GetTokenCount to get num tokens
# request = models.GetTokenCountRequest()
# params = {
# "Prompt": text
# }
# request.from_json_string(json.dumps(params))
# response = client.GetTokenCount(request)
# num_tokens += response.TokenCount
return num_tokens
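The _invoke loop above issues one GetEmbedding request per input text. For reference, a standalone sketch of that SDK call outside the model class (credentials are placeholders; the client setup mirrors _setup_hunyuan_client):

import json

from tencentcloud.common import credential
from tencentcloud.common.profile.client_profile import ClientProfile
from tencentcloud.common.profile.http_profile import HttpProfile
from tencentcloud.hunyuan.v20230901 import hunyuan_client, models

cred = credential.Credential("SECRET_ID", "SECRET_KEY")  # placeholders
http_profile = HttpProfile()
http_profile.endpoint = "hunyuan.tencentcloudapi.com"
client_profile = ClientProfile()
client_profile.httpProfile = http_profile
client = hunyuan_client.HunyuanClient(cred, "", client_profile)

request = models.GetEmbeddingRequest()
request.from_json_string(json.dumps({"Input": "hello"}))
response = client.GetEmbedding(request)
print(response.Usage.TotalTokens, len(response.Data[0].Embedding))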

View File

@@ -34,3 +34,8 @@ parameter_rules:
min: -2
max: 2
default: 0
pricing:
input: '0.0027'
output: '0.0027'
unit: '0.0001'
currency: USD

Some files were not shown because too many files have changed in this diff