From c13dc620656903e0cdbe973fd0164a0771ec4a39 Mon Sep 17 00:00:00 2001
From: Hanqing Zhao <sherry9277@gmail.com>
Date: Mon, 28 Oct 2024 16:31:58 +0800
Subject: [PATCH 01/29] Modify and add jp translation (#9930)

---
 web/i18n/ja-JP/app-annotation.ts   |  2 ++
 web/i18n/ja-JP/app-debug.ts        | 57 ++++++++++++++++++++++++++++--
 web/i18n/ja-JP/dataset-settings.ts |  2 +-
 web/i18n/ja-JP/dataset.ts          |  2 +-
 web/i18n/ja-JP/workflow.ts         | 38 ++++++++++----------
 5 files changed, 78 insertions(+), 23 deletions(-)
diff --git a/web/i18n/ja-JP/app-annotation.ts b/web/i18n/ja-JP/app-annotation.ts
index 6c6c98cdd0..f34d8d2acd 100644
--- a/web/i18n/ja-JP/app-annotation.ts
+++ b/web/i18n/ja-JP/app-annotation.ts
@@ -9,6 +9,8 @@ const translation = {
   table: {
     header: {
       question: '質問',
+      match: 'マッチ',
+      response: '応答',
       answer: '回答',
       createdAt: '作成日時',
       hits: 'ヒット数',
diff --git a/web/i18n/ja-JP/app-debug.ts b/web/i18n/ja-JP/app-debug.ts
index 0ba4c35b0d..620d9b2f55 100644
--- a/web/i18n/ja-JP/app-debug.ts
+++ b/web/i18n/ja-JP/app-debug.ts
@@ -150,7 +150,7 @@ const translation = {
       title: '会話履歴',
       description: '会話の役割に接頭辞名を設定します',
       tip: '会話履歴は有効になっていません。上記のプロンプトに <histories> を追加してください。',
-      learnMore: '詳細',
+      learnMore: '詳細を見る',
       editModal: {
         title: '会話役割名の編集',
         userPrefix: 'ユーザー接頭辞',
@@ -163,6 +163,7 @@ const translation = {
     moderation: {
       title: 'コンテンツのモデレーション',
       description: 'モデレーションAPIを使用するか、機密語リストを維持することで、モデルの出力を安全にします。',
+      contentEnableLabel: 'モデレート・コンテンツを有効にする',
       allEnabled: '入力/出力コンテンツが有効になっています',
       inputEnabled: '入力コンテンツが有効になっています',
       outputEnabled: '出力コンテンツが有効になっています',
@@ -198,6 +199,25 @@ const translation = {
         },
       },
     },
+    fileUpload: {
+      title: 'ファイル アップロード',
+      description: 'チャットの入力ボックスは画像やドキュメントやその他のファイルのアップロードをサポートします。',
+      supportedTypes: 'サポートされるファイルのタイプ',
+      numberLimit: '最大アップロード数',
+      modalTitle: 'ファイル アップロード設定',
+    },
+    imageUpload: {
+      title: '画像アップロード',
+      description: '画像アップロードをサポートする',
+      supportedTypes: 'サポートされるファイルのタイプ',
+      numberLimit: '最大アップロード数',
+      modalTitle: '画像アップロード設定',
+    },
+    bar: {
+      empty: 'Webアプリのユーザーエクスペリエンスを強化する機能を有効にする',
+      enableText: '有効な機能',
+      manage: '管理',
+    },
   },
   codegen: {
     title: 'コードジェネレーター',
@@ -278,6 +298,10 @@ const translation = {
     waitForBatchResponse: 'バッチタスクへの応答が完了するまでお待ちください。',
     notSelectModel: 'モデルを選択してください',
     waitForImgUpload: '画像のアップロードが完了するまでお待ちください',
+    waitForFileUpload: 'ファイルのアップロードが完了するまでお待ちください',
+  },
+  warningMessage: {
+    timeoutExceeded: 'タイムアウトのため結果が表示されません。完全な結果を手にいれるためには、ログを参照してください。',
   },
   chatSubTitle: '手順',
   completionSubTitle: '接頭辞プロンプト',
@@ -319,6 +343,8 @@ const translation = {
     'paragraph': '段落',
     'select': '選択',
     'number': '数値',
+    'single-file': '単一ファイル',
+    'multi-files': 'ファイルリスト',
     'notSet': '設定されていません。プレフィックスのプロンプトで {{input}} を入力してみてください。',
     'stringTitle': 'フォームテキストボックスオプション',
     'maxLength': '最大長',
@@ -330,6 +356,31 @@ const translation = {
     'inputPlaceholder': '入力してください',
     'content': 'コンテンツ',
     'required': '必須',
+    'file': {
+      supportFileTypes: 'サポートされたファイルタイプ',
+      image: {
+        name: '画像',
+      },
+      audio: {
+        name: '音声',
+      },
+      document: {
+        name: 'ドキュメント',
+      },
+      video: {
+        name: '映像',
+      },
+      custom: {
+        name: '他のファイルタイプ',
+        description: '他のファイルタイプを指定する。',
+        createPlaceholder: '+ 拡張子, 例：.doc',
+      },
+    },
+    'uploadFileTypes': 'アップロードされたファイルのタイプ',
+    'localUpload': 'ローカル アップロード',
+    'both': '両方',
+    'maxNumberOfUploads': 'アップロードの最大数',
+    'maxNumberTip': 'ドキュメント < {{docLimit}}, 画像 < {{imgLimit}}, 音声 < {{audioLimit}}, 映像 < {{videoLimit}}',
     'errorMsg': {
       varNameRequired: '変数名は必須です',
       labelNameRequired: 'ラベル名は必須です',
@@ -341,6 +392,7 @@ const translation = {
   vision: {
     name: 'ビジョン',
     description: 'ビジョンを有効にすると、モデルが画像を受け取り、それに関する質問に答えることができます。',
+    onlySupportVisionModelTip: 'ビジョンモデルのみをサポート',
     settings: '設定',
     visionSettings: {
       title: 'ビジョン設定',
@@ -369,7 +421,7 @@ const translation = {
       voice: '音声',
       autoPlay: '自動再生',
       autoPlayEnabled: '開ける',
-      autoPlayDisabled: '關閉',
+      autoPlayDisabled: '閉じる',
     },
   },
   openingStatement: {
@@ -408,6 +460,7 @@ const translation = {
     run: '実行',
   },
   result: '出力テキスト',
+  noResult: '出力はここに表示されます。',
   datasetConfig: {
     settingTitle: 'リトリーバル設定',
     knowledgeTip: 'ナレッジを追加するには「+」ボタンをクリックしてください',
diff --git a/web/i18n/ja-JP/dataset-settings.ts b/web/i18n/ja-JP/dataset-settings.ts
index 1eb3dabb74..f0b8c76a24 100644
--- a/web/i18n/ja-JP/dataset-settings.ts
+++ b/web/i18n/ja-JP/dataset-settings.ts
@@ -24,7 +24,7 @@ const translation = {
     embeddingModelTipLink: '設定',
     retrievalSetting: {
       title: '検索設定',
-      learnMore: '詳細を学ぶ',
+      learnMore: '詳細を見る',
       description: ' 検索方法についての詳細',
       longDescription: ' 検索方法についての詳細については、いつでもナレッジの設定で変更できます。',
     },
diff --git a/web/i18n/ja-JP/dataset.ts b/web/i18n/ja-JP/dataset.ts
index d995509a3f..f15f0dfb1a 100644
--- a/web/i18n/ja-JP/dataset.ts
+++ b/web/i18n/ja-JP/dataset.ts
@@ -101,7 +101,7 @@ const translation = {
       end: '.次に、対応するナレッジIDを見つけて、左側のフォームに入力します。すべての情報が正しい場合は、接続ボタンをクリックした後、ナレッジベースの検索テストに自動的にジャンプします。',
     },
     title: '外部ナレッジベースに接続する方法',
-    learnMore: '詳細情報',
+    learnMore: '詳細を見る',
   },
   connectHelper: {
     helper2: '取得機能のみがサポートされています',
diff --git a/web/i18n/ja-JP/workflow.ts b/web/i18n/ja-JP/workflow.ts
index 632e5712e5..b6c7786081 100644
--- a/web/i18n/ja-JP/workflow.ts
+++ b/web/i18n/ja-JP/workflow.ts
@@ -19,6 +19,10 @@ const translation = {
     goBackToEdit: '編集に戻る',
     conversationLog: '会話ログ',
     features: '機能',
+    featuresDescription: 'Webアプリのユーザーエクスペリエンスを強化する',
+    ImageUploadLegacyTip: '開始フォームでファイルタイプ変数を作成できるようになりました。まもなく、画像アップロード機能のサポートは終了いたします。',
+    fileUploadTip: '画像アップロード機能がファイルのアップロード機能にアップグレードされました。',
+    featuresDocLink: '詳細を見る',
     debugAndPreview: 'プレビュー',
     restart: '再起動',
     currentDraft: '現在の下書き',
@@ -55,7 +59,7 @@ const translation = {
     viewOnly: '表示のみ',
     showRunHistory: '実行履歴を表示',
     enableJinja: 'Jinjaテンプレートのサポートを有効にする',
-    learnMore: '詳細を学ぶ',
+    learnMore: '詳細を見る',
     copy: 'コピー',
     duplicate: '複製',
     addBlock: 'ブロックを追加',
@@ -95,10 +99,6 @@ const translation = {
     addParallelNode: '並列ノードを追加',
     parallel: '並列',
     branch: 'ブランチ',
-    fileUploadTip: '画像のアップロード機能がファイルのアップロードにアップグレードされました。',
-    featuresDocLink: '詳細情報',
-    ImageUploadLegacyTip: 'これで、開始フォームでファイルタイプ変数を作成できるようになりました。今後、画像のアップロード機能のサポートは終了いたします。',
-    featuresDescription: 'Webアプリのユーザーエクスペリエンスを強化',
   },
   env: {
     envPanelTitle: '環境変数',
@@ -229,8 +229,8 @@ const translation = {
     'iteration-start': 'イテレーション開始',
     'iteration': 'イテレーション',
     'parameter-extractor': 'パラメーター抽出',
-    'document-extractor': 'ドキュメントエクストラクター',
-    'list-operator': 'リスト演算子',
+    'document-extractor': 'テキスト抽出ツール',
+    'list-operator': 'リスト処理',
   },
   blocksAbout: {
     'start': 'ワークフローの開始に必要なパラメータを定義します',
@@ -248,7 +248,7 @@ const translation = {
     'variable-aggregator': '複数のブランチの変数を1つの変数に集約し、下流のノードに対して統一された設定を行います。',
     'iteration': 'リストオブジェクトに対して複数のステップを実行し、すべての結果が出力されるまで繰り返します。',
     'parameter-extractor': '自然言語からツールの呼び出しやHTTPリクエストのための構造化されたパラメーターを抽出するためにLLMを使用します。',
-    'document-extractor': 'アップロードされたドキュメントを LLM で簡単に理解できるテキスト コンテンツに解析するために使用されます。',
+    'document-extractor': 'アップロードされたドキュメントを LLM で簡単に理解できるテキストのコンテンツに解析するために使用されます。',
     'list-operator': '配列のコンテンツをフィルタリングまたはソートするために使用されます。',
   },
   operator: {
@@ -405,7 +405,7 @@ const translation = {
         writeLabel: '書き込みタイムアウト',
         writePlaceholder: '書き込みタイムアウトを秒で入力',
       },
-      type: '種類',
+      type: 'タイプ',
       binaryFileVariable: 'バイナリファイル変数',
     },
     code: {
@@ -443,21 +443,21 @@ const translation = {
         'null': 'null',
         'not null': 'nullでない',
         'regex match': '正規表現マッチ',
-        'in': 'で',
-        'not exists': '存在しません',
-        'exists': '存在',
+        'in': '含まれている',
         'not in': '含まれていない',
         'all of': 'すべての',
+        'exists': '存在します',
+        'not exists': '存在しません',
       },
       enterValue: '値を入力',
       addCondition: '条件を追加',
       conditionNotSetup: '条件が設定されていません',
       selectVariable: '変数を選択...',
       optionName: {
-        audio: 'オーディオ',
+        audio: '音声',
         localUpload: 'ローカルアップロード',
         image: '画像',
-        video: 'ビデオ',
+        video: '映像',
         doc: 'ドキュメント',
         url: 'URL',
       },
@@ -583,7 +583,7 @@ const translation = {
         text: '抽出されたテキスト',
       },
       inputVar: '入力変数',
-      learnMore: '詳細情報',
+      learnMore: '詳細を見る',
       supportFileTypes: 'サポートするファイルタイプ: {{types}}。',
     },
     listFilter: {
@@ -593,13 +593,13 @@ const translation = {
         result: 'フィルター結果',
       },
       limit: 'トップN',
-      asc: 'ASCの',
+      asc: 'ASC',
       filterCondition: 'フィルター条件',
       filterConditionKey: 'フィルター条件キー',
-      orderBy: '注文順',
+      orderBy: '並べる順番',
       filterConditionComparisonValue: 'フィルター条件の値',
-      selectVariableKeyPlaceholder: 'サブ変数キーの選択',
-      filterConditionComparisonOperator: 'フィルター条件比較演算子',
+      selectVariableKeyPlaceholder: 'サブ変数キーを選択する',
+      filterConditionComparisonOperator: 'フィルター条件の比較オペレーター',
       inputVar: '入力変数',
       desc: 'DESC',
     },

From 0ebd9856725e273621db5c7943a9e18e01991aeb Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E6=96=B9=E7=A8=8B?= <fchangenow@163.com>
Date: Mon, 28 Oct 2024 16:52:12 +0800
Subject: [PATCH 02/29] feat: add models for gitee.ai (#9490)

---
 .../gitee_ai/_assets/Gitee-AI-Logo-full.svg   |   6 +
 .../gitee_ai/_assets/Gitee-AI-Logo.svg        |   3 +
 .../model_providers/gitee_ai/_common.py       |  47 +++++++
 .../model_providers/gitee_ai/gitee_ai.py      |  25 ++++
 .../model_providers/gitee_ai/gitee_ai.yaml    |  35 +++++
 .../gitee_ai/llm/Qwen2-72B-Instruct.yaml      | 105 ++++++++++++++
 .../gitee_ai/llm/Qwen2-7B-Instruct.yaml       | 105 ++++++++++++++
 .../gitee_ai/llm/Yi-1.5-34B-Chat.yaml         | 105 ++++++++++++++
 .../gitee_ai/llm/_position.yaml               |   7 +
 .../gitee_ai/llm/codegeex4-all-9b.yaml        | 105 ++++++++++++++
 .../llm/deepseek-coder-33B-instruct-chat.yaml | 105 ++++++++++++++
 ...epseek-coder-33B-instruct-completions.yaml |  91 ++++++++++++
 .../gitee_ai/llm/glm-4-9b-chat.yaml           | 105 ++++++++++++++
 .../model_providers/gitee_ai/llm/llm.py       |  47 +++++++
 .../gitee_ai/rerank/__init__.py               |   0
 .../gitee_ai/rerank/_position.yaml            |   1 +
 .../gitee_ai/rerank/bge-reranker-v2-m3.yaml   |   4 +
 .../model_providers/gitee_ai/rerank/rerank.py | 128 +++++++++++++++++
 .../gitee_ai/speech2text/__init__.py          |   0
 .../gitee_ai/speech2text/_position.yaml       |   2 +
 .../gitee_ai/speech2text/speech2text.py       |  53 +++++++
 .../gitee_ai/speech2text/whisper-base.yaml    |   5 +
 .../gitee_ai/speech2text/whisper-large.yaml   |   5 +
 .../gitee_ai/text_embedding/_position.yaml    |   3 +
 .../text_embedding/bge-large-zh-v1.5.yaml     |   8 ++
 .../gitee_ai/text_embedding/bge-m3.yaml       |   8 ++
 .../text_embedding/bge-small-zh-v1.5.yaml     |   8 ++
 .../gitee_ai/text_embedding/text_embedding.py |  31 ++++
 .../model_providers/gitee_ai/tts/ChatTTS.yaml |  11 ++
 .../tts/FunAudioLLM-CosyVoice-300M.yaml       |  11 ++
 .../model_providers/gitee_ai/tts/__init__.py  |   0
 .../gitee_ai/tts/_position.yaml               |   4 +
 .../gitee_ai/tts/fish-speech-1.2-sft.yaml     |  11 ++
 .../gitee_ai/tts/speecht5_tts.yaml            |  11 ++
 .../model_providers/gitee_ai/tts/tts.py       |  79 +++++++++++
 api/pytest.ini                                |   1 +
 api/tests/integration_tests/.env.example      |   3 +
 .../model_runtime/gitee_ai/__init__.py        |   0
 .../model_runtime/gitee_ai/test_llm.py        | 132 ++++++++++++++++++
 .../model_runtime/gitee_ai/test_provider.py   |  15 ++
 .../model_runtime/gitee_ai/test_rerank.py     |  47 +++++++
 .../gitee_ai/test_speech2text.py              |  45 ++++++
 .../gitee_ai/test_text_embedding.py           |  46 ++++++
 .../model_runtime/gitee_ai/test_tts.py        |  23 +++
 44 files changed, 1586 insertions(+)
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo-full.svg
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo.svg
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/_common.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/gitee_ai.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/gitee_ai.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-72B-Instruct.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-7B-Instruct.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/Yi-1.5-34B-Chat.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/_position.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/codegeex4-all-9b.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-chat.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-completions.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/glm-4-9b-chat.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/llm/llm.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/rerank/__init__.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/rerank/_position.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/rerank/bge-reranker-v2-m3.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/rerank/rerank.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/speech2text/__init__.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/speech2text/_position.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/speech2text/speech2text.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-base.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-large.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/text_embedding/_position.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-large-zh-v1.5.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-m3.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-small-zh-v1.5.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/text_embedding/text_embedding.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/ChatTTS.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/FunAudioLLM-CosyVoice-300M.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/__init__.py
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/_position.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/fish-speech-1.2-sft.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/speecht5_tts.yaml
 create mode 100644 api/core/model_runtime/model_providers/gitee_ai/tts/tts.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/__init__.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_llm.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_provider.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_rerank.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_speech2text.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_text_embedding.py
 create mode 100644 api/tests/integration_tests/model_runtime/gitee_ai/test_tts.py

diff --git a/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo-full.svg b/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo-full.svg
new file mode 100644
index 0000000000..f9738b585b
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo-full.svg
@@ -0,0 +1,6 @@
+<svg width="145" height="40" viewBox="0 0 145 40" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path fill-rule="evenodd" clip-rule="evenodd" d="M25.132 24.3947C25.497 25.7527 25.8984 27.1413 26.3334 28.5834C26.7302 29.8992 25.5459 30.4167 25.0752 29.1758C24.571 27.8466 24.0885 26.523 23.6347 25.1729C21.065 26.4654 18.5025 27.5424 15.5961 28.7541C16.7581 33.0256 17.8309 36.5984 19.4952 39.9935C19.4953 39.9936 19.4953 39.9937 19.4954 39.9938C19.6631 39.9979 19.8313 40 20 40C31.0457 40 40 31.0457 40 20C40 16.0335 38.8453 12.3366 36.8537 9.22729C31.6585 9.69534 27.0513 10.4562 22.8185 11.406C22.8882 12.252 22.9677 13.0739 23.0555 13.855C23.3824 16.7604 23.9112 19.5281 24.6137 22.3836C27.0581 21.2848 29.084 20.3225 30.6816 19.522C32.2154 18.7535 33.6943 18.7062 31.2018 20.6594C29.0388 22.1602 27.0644 23.3566 25.132 24.3947ZM36.1559 8.20846C33.0001 3.89184 28.1561 0.887462 22.5955 0.166882C22.4257 2.86234 22.4785 6.26344 22.681 9.50447C26.7473 8.88859 31.1721 8.46032 36.1559 8.20846ZM19.9369 9.73661e-05C19.7594 2.92694 19.8384 6.65663 20.19 9.91293C17.3748 10.4109 14.7225 11.0064 12.1592 11.7038C12.0486 10.4257 11.9927 9.25764 11.9927 8.24178C11.9927 7.5054 11.3957 6.90844 10.6593 6.90844C9.92296 6.90844 9.32601 7.5054 9.32601 8.24178C9.32601 9.47868 9.42873 10.898 9.61402 12.438C8.33567 12.8278 7.07397 13.2443 5.81918 13.688C5.12493 13.9336 4.76118 14.6954 5.0067 15.3896C5.25223 16.0839 6.01406 16.4476 6.7083 16.2021C7.7931 15.8185 8.88482 15.4388 9.98927 15.0659C10.5222 18.3344 11.3344 21.9428 12.2703 25.4156C12.4336 26.0218 12.6062 26.6262 12.7863 27.2263C9.34168 28.4135 5.82612 29.3782 2.61128 29.8879C0.949407 26.9716 0 23.5967 0 20C0 8.97534 8.92023 0.0341108 19.9369 9.73661e-05ZM4.19152 32.2527C7.45069 36.4516 12.3458 39.3173 17.9204 39.8932C16.5916 37.455 14.9338 33.717 13.5405 29.5901C10.4404 30.7762 7.25883 31.6027 4.19152 32.2527ZM22.9735 23.1135C22.1479 20.41 21.4462 17.5441 20.9225 14.277C20.746 13.5841 20.5918 12.8035 20.4593 11.9636C17.6508 12.6606 14.9992 13.4372 12.4356 14.2598C12.8479 17.4766 13.5448 21.1334 14.5118 24.7218C14.662 25.2792 14.8081 
25.8248 14.9514 26.3594L14.9516 26.3603L14.9524 26.3634L14.9526 26.3639L14.973 26.4401C16.1833 25.9872 17.3746 25.5123 18.53 25.0259C20.1235 24.3552 21.6051 23.7165 22.9735 23.1135Z" fill="#141519"/>
+<path d="M57.0058 34.9872C59.7347 34.9872 61.9133 34.4549 63.5416 33.3903C65.1699 32.3257 65.984 30.9471 65.984 29.2547C65.984 26.5249 63.9464 25.1601 59.8712 25.1601H57.3605C56.5236 25.1601 55.9233 25.0782 55.5594 24.9144C55.1956 24.7506 55.0136 24.4776 55.0136 24.0955C55.0136 23.7133 55.1319 23.3948 55.3684 23.14C55.4593 23.0309 55.5776 22.9945 55.7231 23.0309C56.3053 23.1946 56.8602 23.2765 57.3878 23.2765C59.2617 23.2765 60.7854 22.8261 61.9588 21.9253C63.1323 21.0245 63.719 19.6915 63.719 17.9262C63.719 17.2711 63.6007 16.6887 63.3642 16.1792C63.346 16.1428 63.3506 16.1018 63.3779 16.0563C63.4051 16.0108 63.4461 15.9881 63.5007 15.9881H64.1283C64.5831 15.9881 64.9652 15.8334 65.2745 15.524C65.5838 15.2147 65.7384 14.8325 65.7384 14.3775V13.9954C65.7384 13.5586 65.5838 13.181 65.2745 12.8625C64.9652 12.5441 64.5831 12.3848 64.1283 12.3848H60.1168C59.9894 12.3848 59.853 12.3666 59.7074 12.3302C58.9979 12.1118 58.2247 12.0027 57.3878 12.0027C56.2053 12.0027 55.1228 12.2074 54.1404 12.6168C53.1579 13.0263 52.3438 13.6814 51.6979 14.5823C51.0521 15.4831 50.7292 16.5522 50.7292 17.7897C50.7292 18.6451 50.9293 19.4276 51.3295 20.1373C51.7298 20.8471 52.2301 21.4203 52.8305 21.8571C52.8668 21.8753 52.885 21.9026 52.885 21.939C52.885 21.9754 52.8668 22.0118 52.8305 22.0481C52.3211 22.4121 51.9117 22.8534 51.6024 23.3721C51.2932 23.8907 51.1385 24.423 51.1385 24.969C51.1385 26.1337 51.6024 27.0345 52.5303 27.6714C52.5667 27.6896 52.5849 27.7215 52.5849 27.767C52.5849 27.8125 52.5667 27.8534 52.5303 27.8898C51.8026 28.2538 51.2522 28.6996 50.8793 29.2274C50.5063 29.7552 50.3198 30.3375 50.3198 30.9744C50.3198 31.8844 50.6291 32.6487 51.2477 33.2674C51.8662 33.8862 52.6622 34.3275 53.6355 34.5914C54.6088 34.8552 55.7322 34.9872 57.0058 34.9872ZM57.3878 20.2738C56.7874 20.2738 56.3008 20.06 55.9278 19.6323C55.5549 19.2047 55.3684 18.5905 55.3684 17.7897C55.3684 17.0072 55.5549 16.4021 55.9278 15.9744C56.3008 15.5468 56.7874 15.333 57.3878 15.333C57.9882 15.333 58.4748 
15.5422 58.8478 15.9608C59.2208 16.3794 59.4072 16.989 59.4072 17.7897C59.4072 18.5905 59.2208 19.2047 58.8478 19.6323C58.4748 20.06 57.9882 20.2738 57.3878 20.2738ZM57.7699 31.8753C56.7329 31.8753 55.9096 31.7342 55.3002 31.4522C54.6907 31.1701 54.386 30.747 54.386 30.1828C54.386 29.7279 54.5952 29.3002 55.0136 28.8998C55.0682 28.8452 55.1501 28.8179 55.2592 28.8179H55.3411C55.7959 28.9089 56.4873 28.9544 57.4151 28.9544H58.916C59.7165 28.9544 60.3032 29.0363 60.6762 29.2001C61.0492 29.3639 61.2356 29.6642 61.2356 30.1009C61.2356 30.6105 60.9127 31.0336 60.2669 31.3703C59.621 31.7069 58.7887 31.8753 57.7699 31.8753ZM70.978 10.0918C71.7967 10.0918 72.4698 9.85524 72.9974 9.38209C73.525 8.90893 73.7888 8.29928 73.7888 7.55315C73.7888 6.80702 73.525 6.19282 72.9974 5.71057C72.4698 5.22831 71.7967 4.98718 70.978 4.98718C70.1411 4.98718 69.4543 5.22831 68.9176 5.71057C68.3809 6.19282 68.1126 6.80702 68.1126 7.55315C68.1126 8.29928 68.3809 8.90893 68.9176 9.38209C69.4543 9.85524 70.1411 10.0918 70.978 10.0918ZM71.824 28.2174C72.2606 28.2174 72.6381 28.0582 72.9565 27.7397C73.2749 27.4212 73.434 27.0436 73.434 26.6068V13.9135C73.434 13.4767 73.2749 13.0991 72.9565 12.7806C72.6381 12.4622 72.2606 12.3029 71.824 12.3029H70.1047C69.6499 12.3029 69.2678 12.4622 68.9586 12.7806C68.6493 13.0991 68.4946 13.4767 68.4946 13.9135V26.6068C68.4946 27.0436 68.6493 27.4212 68.9586 27.7397C69.2678 28.0582 69.6499 28.2174 70.1047 28.2174H71.824ZM83.6949 28.5996C84.3862 28.5996 85.0685 28.5359 85.7416 28.4085C86.1782 28.3357 86.5148 28.0991 86.7513 27.6987C86.9151 27.4258 86.9969 27.1437 86.9969 26.8525C86.9969 26.7251 86.9878 26.5886 86.9696 26.4431L86.8605 26.0063C86.7695 25.6241 86.5421 25.3193 86.1783 25.0918C85.8144 24.8643 85.405 24.7415 84.9502 24.7233C83.6949 24.6687 83.0672 23.8498 83.0672 22.2665V16.3976C83.0672 16.2702 83.1309 16.2065 83.2583 16.2065H85.1958C85.6325 16.2065 86.01 16.0472 86.3283 15.7288C86.6467 15.4103 86.8059 15.0327 86.8059 14.5959V13.9135C86.8059 13.4767 
86.6467 13.0991 86.3283 12.7806C86.01 12.4622 85.6325 12.3029 85.1958 12.3029H83.2583C83.1309 12.3029 83.0672 12.2392 83.0672 12.1118V9.73696C83.0672 9.282 82.9081 8.89983 82.5897 8.59046C82.2713 8.28109 81.8938 8.1264 81.4572 8.1264H80.5293C80.0745 8.1264 79.6742 8.27654 79.3286 8.57681C78.9829 8.87708 78.7737 9.2547 78.7009 9.70966L78.4007 12.1118C78.3825 12.2392 78.3007 12.312 78.1551 12.3302L77.5275 12.3848C77.0726 12.4212 76.6906 12.6077 76.3813 12.9444C76.072 13.2811 75.9174 13.6769 75.9174 14.1319V14.5959C75.9174 15.0327 76.0766 15.4103 76.395 15.7288C76.7133 16.0472 77.0908 16.2065 77.5275 16.2065H77.8822C78.0096 16.2065 78.0733 16.2702 78.0733 16.3976V22.3211C78.0733 24.3047 78.5281 25.8471 79.4377 26.9481C80.3474 28.0491 81.7664 28.5996 83.6949 28.5996ZM97.0395 28.5996C98.4949 28.5996 99.9322 28.2629 101.351 27.5895C101.751 27.4076 102.006 27.0891 102.115 26.6341C102.17 26.4885 102.197 26.343 102.197 26.1974C102.197 25.9244 102.115 25.6514 101.952 25.3784L101.87 25.2147C101.651 24.8325 101.333 24.5777 100.915 24.4503C100.714 24.3957 100.514 24.3684 100.314 24.3684C100.078 24.3684 99.8503 24.4048 99.632 24.4776C99.0134 24.696 98.3767 24.8052 97.7217 24.8052C95.5749 24.8052 94.2741 23.8498 93.8193 21.939C93.8011 21.8844 93.8102 21.8343 93.8466 21.7888C93.883 21.7433 93.9285 21.7206 93.983 21.7206H101.488C101.961 21.7206 102.379 21.5704 102.743 21.2702C103.107 20.9699 103.298 20.5923 103.316 20.1373V19.6187C103.316 17.3257 102.734 15.4694 101.57 14.05C100.405 12.6305 98.7132 11.9208 96.4937 11.9208C95.5295 11.9208 94.5971 12.1164 93.6965 12.5077C92.796 12.8989 91.9955 13.4449 91.295 14.1455C90.5946 14.8461 90.0306 15.7288 89.6031 16.7934C89.1755 17.858 88.9618 19.0181 88.9618 20.2738C88.9618 22.8398 89.7213 24.8689 91.2405 26.3612C92.7596 27.8534 94.6926 28.5996 97.0395 28.5996ZM98.8952 18.4995H93.9012C93.7738 18.4995 93.7102 18.454 93.7102 18.363C93.7102 17.6168 94.0649 16.9526 94.7744 16.3703C95.2839 15.9335 95.8933 15.7151 96.6028 15.7151C97.4215 15.7151 
98.0355 15.9471 98.4449 16.4112C98.8542 16.8753 99.0771 17.4986 99.1135 18.2811V18.3084C99.1135 18.4358 99.0407 18.4995 98.8952 18.4995ZM113.686 28.5996C115.142 28.5996 116.579 28.2629 117.998 27.5895C118.398 27.4076 118.653 27.0891 118.762 26.6341C118.817 26.4885 118.844 26.343 118.844 26.1974C118.844 25.9244 118.762 25.6514 118.598 25.3784L118.516 25.2147C118.298 24.8325 117.98 24.5777 117.561 24.4503C117.361 24.3957 117.161 24.3684 116.961 24.3684C116.724 24.3684 116.497 24.4048 116.279 24.4776C115.66 24.696 115.023 24.8052 114.368 24.8052C112.222 24.8052 110.921 23.8498 110.466 21.939C110.448 21.8844 110.457 21.8343 110.493 21.7888C110.53 21.7433 110.575 21.7206 110.63 21.7206H118.134C118.607 21.7206 119.026 21.5704 119.39 21.2702C119.753 20.9699 119.944 20.5923 119.963 20.1373V19.6187C119.963 17.3257 119.38 15.4694 118.216 14.05C117.052 12.6305 115.36 11.9208 113.14 11.9208C112.176 11.9208 111.244 12.1164 110.343 12.5077C109.443 12.8989 108.642 13.4449 107.942 14.1455C107.241 14.8461 106.677 15.7288 106.25 16.7934C105.822 17.858 105.608 19.0181 105.608 20.2738C105.608 22.8398 106.368 24.8689 107.887 26.3612C109.406 27.8534 111.339 28.5996 113.686 28.5996ZM115.542 18.4995H110.548C110.42 18.4995 110.357 18.454 110.357 18.363C110.357 17.6168 110.712 16.9526 111.421 16.3703C111.93 15.9335 112.54 15.7151 113.249 15.7151C114.068 15.7151 114.682 15.9471 115.091 16.4112C115.501 16.8753 115.724 17.4986 115.76 18.2811V18.3084C115.76 18.4358 115.687 18.4995 115.542 18.4995Z" fill="black"/>
+<path d="M126.817 28.3723H123.96L131.579 11.7057L139.377 28.3723H136.579L131.579 17.8366L126.817 28.3723Z" fill="black"/>
+<path d="M142.141 12.039H144.998V28.3724H142.141V12.039Z" fill="black"/>
+</svg>
diff --git a/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo.svg b/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo.svg
new file mode 100644
index 0000000000..1f51187f19
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/_assets/Gitee-AI-Logo.svg
@@ -0,0 +1,3 @@
+<svg width="40" height="40" viewBox="0 0 40 40" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path fill-rule="evenodd" clip-rule="evenodd" d="M25.132 24.3947C25.497 25.7527 25.8984 27.1413 26.3334 28.5834C26.7302 29.8992 25.5459 30.4167 25.0752 29.1758C24.571 27.8466 24.0885 26.523 23.6347 25.1729C21.065 26.4654 18.5025 27.5424 15.5961 28.7541C16.7581 33.0256 17.8309 36.5984 19.4952 39.9935C19.4953 39.9936 19.4953 39.9937 19.4954 39.9938C19.6631 39.9979 19.8313 40 20 40C31.0457 40 40 31.0457 40 20C40 16.0335 38.8453 12.3366 36.8537 9.22729C31.6585 9.69534 27.0513 10.4562 22.8185 11.406C22.8882 12.252 22.9677 13.0739 23.0555 13.855C23.3824 16.7604 23.9112 19.5281 24.6137 22.3836C27.0581 21.2848 29.084 20.3225 30.6816 19.522C32.2154 18.7535 33.6943 18.7062 31.2018 20.6594C29.0388 22.1602 27.0644 23.3566 25.132 24.3947ZM36.1559 8.20846C33.0001 3.89184 28.1561 0.887462 22.5955 0.166882C22.4257 2.86234 22.4785 6.26344 22.681 9.50447C26.7473 8.88859 31.1721 8.46032 36.1559 8.20846ZM19.9369 9.73661e-05C19.7594 2.92694 19.8384 6.65663 20.19 9.91293C17.3748 10.4109 14.7225 11.0064 12.1592 11.7038C12.0486 10.4257 11.9927 9.25764 11.9927 8.24178C11.9927 7.5054 11.3957 6.90844 10.6593 6.90844C9.92296 6.90844 9.32601 7.5054 9.32601 8.24178C9.32601 9.47868 9.42873 10.898 9.61402 12.438C8.33567 12.8278 7.07397 13.2443 5.81918 13.688C5.12493 13.9336 4.76118 14.6954 5.0067 15.3896C5.25223 16.0839 6.01406 16.4476 6.7083 16.2021C7.7931 15.8185 8.88482 15.4388 9.98927 15.0659C10.5222 18.3344 11.3344 21.9428 12.2703 25.4156C12.4336 26.0218 12.6062 26.6262 12.7863 27.2263C9.34168 28.4135 5.82612 29.3782 2.61128 29.8879C0.949407 26.9716 0 23.5967 0 20C0 8.97534 8.92023 0.0341108 19.9369 9.73661e-05ZM4.19152 32.2527C7.45069 36.4516 12.3458 39.3173 17.9204 39.8932C16.5916 37.455 14.9338 33.717 13.5405 29.5901C10.4404 30.7762 7.25883 31.6027 4.19152 32.2527ZM22.9735 23.1135C22.1479 20.41 21.4462 17.5441 20.9225 14.277C20.746 13.5841 20.5918 12.8035 20.4593 11.9636C17.6508 12.6606 14.9992 13.4372 12.4356 14.2598C12.8479 17.4766 13.5448 21.1334 14.5118 24.7218C14.662 25.2792 14.8081 
25.8248 14.9514 26.3594L14.9516 26.3603L14.9524 26.3634L14.9526 26.3639L14.973 26.4401C16.1833 25.9872 17.3746 25.5123 18.53 25.0259C20.1235 24.3552 21.6051 23.7165 22.9735 23.1135Z" fill="#141519"/>
+</svg>
diff --git a/api/core/model_runtime/model_providers/gitee_ai/_common.py b/api/core/model_runtime/model_providers/gitee_ai/_common.py
new file mode 100644
index 0000000000..0750f3b75d
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/_common.py
@@ -0,0 +1,47 @@
+from dashscope.common.error import (
+    AuthenticationError,
+    InvalidParameter,
+    RequestFailure,
+    ServiceUnavailableError,
+    UnsupportedHTTPMethod,
+    UnsupportedModel,
+)
+
+from core.model_runtime.errors.invoke import (
+    InvokeAuthorizationError,
+    InvokeBadRequestError,
+    InvokeConnectionError,
+    InvokeError,
+    InvokeRateLimitError,
+    InvokeServerUnavailableError,
+)
+
+
+class _CommonGiteeAI:
+    @property
+    def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
+        """
+        Map exceptions raised during model invocation to unified invoke errors.
+        Each key is the unified error type raised to the caller; each value lists
+        the dashscope.common.error exception types that are converted to it.
+        NOTE(review): these are dashscope SDK error classes — confirm Gitee AI calls raise them.
+
+        :return: Invoke error mapping
+        """
+        return {
+            InvokeConnectionError: [
+                RequestFailure,
+            ],
+            InvokeServerUnavailableError: [
+                ServiceUnavailableError,
+            ],
+            InvokeRateLimitError: [],
+            InvokeAuthorizationError: [
+                AuthenticationError,
+            ],
+            InvokeBadRequestError: [
+                InvalidParameter,
+                UnsupportedModel,
+                UnsupportedHTTPMethod,
+            ],
+        }
diff --git a/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.py b/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.py
new file mode 100644
index 0000000000..ca67594ce4
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.py
@@ -0,0 +1,25 @@
+import logging
+
+from core.model_runtime.entities.model_entities import ModelType
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.__base.model_provider import ModelProvider
+
+logger = logging.getLogger(__name__)
+
+
+class GiteeAIProvider(ModelProvider):
+    def validate_provider_credentials(self, credentials: dict) -> None:
+        """
+        Validate provider credentials by checking them against the Qwen2-7B-Instruct LLM.
+        Any failure is re-raised to the caller; unexpected errors are logged first.
+
+        :param credentials: provider credentials, credentials form defined in `provider_credential_schema`.
+        """
+        try:
+            model_instance = self.get_model_instance(ModelType.LLM)
+            model_instance.validate_credentials(model="Qwen2-7B-Instruct", credentials=credentials)
+        except CredentialsValidateFailedError:
+            raise  # bare raise: propagate unchanged, no extra traceback frame
+        except Exception:
+            logger.exception(f"{self.get_provider_schema().provider} credentials validate failed")
+            raise
diff --git a/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.yaml b/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.yaml
new file mode 100644
index 0000000000..7f7d0f2e53
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/gitee_ai.yaml
@@ -0,0 +1,35 @@
+provider: gitee_ai
+label:
+  en_US: Gitee AI
+  zh_Hans: Gitee AI
+description:
+  en_US: Quickly try out large models and stay ahead in exploring the open-source AI world
+  zh_Hans: 快速体验大模型，领先探索 AI 开源世界
+icon_small:
+  en_US: Gitee-AI-Logo.svg
+icon_large:
+  en_US: Gitee-AI-Logo-full.svg
+help:
+  title:
+    en_US: Get your token from Gitee AI
+    zh_Hans: 从 Gitee AI 获取 token
+  url:
+    en_US: https://ai.gitee.com/dashboard/settings/tokens
+supported_model_types:
+  - llm
+  - text-embedding
+  - rerank
+  - speech2text
+  - tts
+configurate_methods:
+  - predefined-model
+provider_credential_schema:
+  credential_form_schemas:
+    - variable: api_key
+      label:
+        en_US: API Key
+      type: secret-input
+      required: true
+      placeholder:
+        zh_Hans: 在此输入您的 API Key
+        en_US: Enter your API Key
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-72B-Instruct.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-72B-Instruct.yaml
new file mode 100644
index 0000000000..0348438a75
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-72B-Instruct.yaml
@@ -0,0 +1,105 @@
+model: Qwen2-72B-Instruct
+label:
+  zh_Hans: Qwen2-72B-Instruct
+  en_US: Qwen2-72B-Instruct
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 6400
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-7B-Instruct.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-7B-Instruct.yaml
new file mode 100644
index 0000000000..ba1ad788f5
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/Qwen2-7B-Instruct.yaml
@@ -0,0 +1,105 @@
+model: Qwen2-7B-Instruct
+label:
+  zh_Hans: Qwen2-7B-Instruct
+  en_US: Qwen2-7B-Instruct
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 32768
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/Yi-1.5-34B-Chat.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/Yi-1.5-34B-Chat.yaml
new file mode 100644
index 0000000000..f7260c987b
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/Yi-1.5-34B-Chat.yaml
@@ -0,0 +1,105 @@
+model: Yi-1.5-34B-Chat
+label:
+  zh_Hans: Yi-1.5-34B-Chat
+  en_US: Yi-1.5-34B-Chat
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 4096
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/_position.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/_position.yaml
new file mode 100644
index 0000000000..21f6120742
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/_position.yaml
@@ -0,0 +1,7 @@
+- Qwen2-7B-Instruct
+- Qwen2-72B-Instruct
+- Yi-1.5-34B-Chat
+- glm-4-9b-chat
+- deepseek-coder-33B-instruct-chat
+- deepseek-coder-33B-instruct-completions
+- codegeex4-all-9b
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/codegeex4-all-9b.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/codegeex4-all-9b.yaml
new file mode 100644
index 0000000000..8632cd92ab
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/codegeex4-all-9b.yaml
@@ -0,0 +1,105 @@
+model: codegeex4-all-9b
+label:
+  zh_Hans: codegeex4-all-9b
+  en_US: codegeex4-all-9b
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 40960
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-chat.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-chat.yaml
new file mode 100644
index 0000000000..2ac00761d5
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-chat.yaml
@@ -0,0 +1,105 @@
+model: deepseek-coder-33B-instruct-chat
+label:
+  zh_Hans: deepseek-coder-33B-instruct-chat
+  en_US: deepseek-coder-33B-instruct-chat
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 9000
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-completions.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-completions.yaml
new file mode 100644
index 0000000000..7c364d89f7
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/deepseek-coder-33B-instruct-completions.yaml
@@ -0,0 +1,91 @@
+model: deepseek-coder-33B-instruct-completions
+label:
+  zh_Hans: deepseek-coder-33B-instruct-completions
+  en_US: deepseek-coder-33B-instruct-completions
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: completion
+  context_size: 9000
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/glm-4-9b-chat.yaml b/api/core/model_runtime/model_providers/gitee_ai/llm/glm-4-9b-chat.yaml
new file mode 100644
index 0000000000..2afe1cf959
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/glm-4-9b-chat.yaml
@@ -0,0 +1,105 @@
+model: glm-4-9b-chat
+label:
+  zh_Hans: glm-4-9b-chat
+  en_US: glm-4-9b-chat
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 32768
+parameter_rules:
+  - name: stream
+    use_template: boolean
+    label:
+      en_US: "Stream"
+      zh_Hans: "流式"
+    type: boolean
+    default: true
+    required: true
+    help:
+      en_US: "Whether to return the results in batches through streaming. If set to true, the generated text will be pushed to the user in real time during the generation process."
+      zh_Hans: "是否通过流式分批返回结果。如果设置为 true，生成过程中实时地向用户推送每一部分生成的文本。"
+
+  - name: max_tokens
+    use_template: max_tokens
+    label:
+      en_US: "Max Tokens"
+      zh_Hans: "最大Token数"
+    type: int
+    default: 512
+    min: 1
+    required: true
+    help:
+      en_US: "The maximum number of tokens that can be generated by the model varies depending on the model."
+      zh_Hans: "模型可生成的最大 token 个数，不同模型上限不同。"
+
+  - name: temperature
+    use_template: temperature
+    label:
+      en_US: "Temperature"
+      zh_Hans: "采样温度"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The sampling temperature controls the randomness of the output. The temperature value is within the range of [0.0, 1.0]. The higher the value, the more random and creative the output; the lower the value, the more stable it is. It is recommended to adjust either top_p or temperature according to your needs, but not both at the same time."
+      zh_Hans: "采样温度控制输出的随机性。温度值在 [0.0, 1.0] 范围内，值越高，输出越随机和创造性；值越低，输出越稳定。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_p
+    use_template: top_p
+    label:
+      en_US: "Top P"
+      zh_Hans: "Top P"
+    type: float
+    default: 0.7
+    min: 0.0
+    max: 1.0
+    precision: 1
+    required: true
+    help:
+      en_US: "The value range of the sampling method is [0.0, 1.0]. The top_p value determines that the model selects tokens from the top p% of candidate words with the highest probability; when top_p is 0, this parameter is invalid. It is recommended to adjust either top_p or temperature parameters according to your needs to avoid adjusting both at the same time."
+      zh_Hans: "采样方法的取值范围为 [0.0,1.0]。top_p 值确定模型从概率最高的前p%的候选词中选取 tokens；当 top_p 为 0 时，此参数无效。建议根据需求调整 top_p 或 temperature 参数，避免同时调整两者。"
+
+  - name: top_k
+    use_template: top_k
+    label:
+      en_US: "Top K"
+      zh_Hans: "Top K"
+    type: int
+    default: 50
+    min: 0
+    max: 100
+    required: true
+    help:
+      en_US: "The value range is [0,100], which limits the model to only select from the top k words with the highest probability when choosing the next word at each step. The larger the value, the more diverse text generation will be."
+      zh_Hans: "取值范围为 [0,100]，限制模型在每一步选择下一个词时，只从概率最高的前 k 个词中选取。数值越大，文本生成越多样。"
+
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    label:
+      en_US: "Frequency Penalty"
+      zh_Hans: "频率惩罚"
+    type: float
+    default: 0
+    min: -1.0
+    max: 1.0
+    precision: 1
+    required: false
+    help:
+      en_US: "Used to adjust the frequency of repeated content in automatically generated text. Positive numbers reduce repetition, while negative numbers increase repetition. After setting this parameter, if a word has already appeared in the text, the model will decrease the probability of choosing that word for subsequent generation."
+      zh_Hans: "用于调整自动生成文本中重复内容的频率。正数减少重复，负数增加重复。设置此参数后，如果一个词在文本中已经出现过，模型在后续生成中选择该词的概率会降低。"
+
+  - name: user
+    use_template: text
+    label:
+      en_US: "User"
+      zh_Hans: "用户"
+    type: string
+    required: false
+    help:
+      en_US: "Used to track and differentiate conversation requests from different users."
+      zh_Hans: "用于追踪和区分不同用户的对话请求。"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/llm/llm.py b/api/core/model_runtime/model_providers/gitee_ai/llm/llm.py
new file mode 100644
index 0000000000..b65db6f665
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/llm/llm.py
@@ -0,0 +1,80 @@
+from collections.abc import Generator
+from typing import Optional, Union
+
+from core.model_runtime.entities.llm_entities import LLMMode, LLMResult
+from core.model_runtime.entities.message_entities import (
+    PromptMessage,
+    PromptMessageTool,
+)
+from core.model_runtime.model_providers.openai_api_compatible.llm.llm import OAIAPICompatLargeLanguageModel
+
+
+class GiteeAILargeLanguageModel(OAIAPICompatLargeLanguageModel):
+    """
+    Gitee AI large language model built on the OpenAI-API-compatible base implementation.
+    """
+
+    # Models whose endpoint path segment differs from the configured model name.
+    MODEL_TO_IDENTITY: dict[str, str] = {
+        "Yi-1.5-34B-Chat": "Yi-34B-Chat",
+        "deepseek-coder-33B-instruct-completions": "deepseek-coder-33B-instruct",
+        "deepseek-coder-33B-instruct-chat": "deepseek-coder-33B-instruct",
+    }
+
+    def _invoke(
+        self,
+        model: str,
+        credentials: dict,
+        prompt_messages: list[PromptMessage],
+        model_parameters: dict,
+        tools: Optional[list[PromptMessageTool]] = None,
+        stop: Optional[list[str]] = None,
+        stream: bool = True,
+        user: Optional[str] = None,
+    ) -> Union[LLMResult, Generator]:
+        """
+        Point the credentials at the Gitee AI endpoint for `model`, then delegate to the base class.
+
+        :param model: model name
+        :param credentials: model credentials; `endpoint_url` and `mode` are set on this dict in place
+        :param prompt_messages: prompt messages, forwarded unchanged
+        :param model_parameters: model parameters, forwarded unchanged
+        :param tools: optional tools, forwarded unchanged
+        :param stop: optional stop strings, forwarded unchanged
+        :param stream: forwarded unchanged
+        :param user: optional user value, forwarded unchanged
+        :return: whatever the base implementation returns
+        """
+        self._add_custom_parameters(credentials, model, model_parameters)
+        # Pass `user` explicitly, otherwise the base implementation only ever sees its own default.
+        return super()._invoke(model, credentials, prompt_messages, model_parameters, tools, stop, stream, user)
+
+    def validate_credentials(self, model: str, credentials: dict) -> None:
+        """
+        Point the credentials at the Gitee AI endpoint for `model`, then run the base class validation.
+
+        :param model: model name
+        :param credentials: model credentials; `endpoint_url` and `mode` are set on this dict in place
+        """
+        self._add_custom_parameters(credentials, model, None)
+        super().validate_credentials(model, credentials)
+
+    @staticmethod
+    def _add_custom_parameters(credentials: dict, model: str, model_parameters: Optional[dict] = None) -> None:
+        """
+        Set the Gitee AI `endpoint_url` and the LLM `mode` on `credentials` (mutated in place).
+
+        :param credentials: model credentials to update
+        :param model: model name; names ending in "completions" select completion mode, all others chat mode
+        :param model_parameters: not used by this method; accepts None
+        """
+        if model is None:
+            # NOTE(review): this default is not among the LLMs listed for this provider - confirm intent.
+            model = "bge-large-zh-v1.5"
+
+        model_identity = GiteeAILargeLanguageModel.MODEL_TO_IDENTITY.get(model, model)
+        credentials["endpoint_url"] = f"https://ai.gitee.com/api/serverless/{model_identity}/"
+        if model.endswith("completions"):
+            credentials["mode"] = LLMMode.COMPLETION.value
+        else:
+            credentials["mode"] = LLMMode.CHAT.value
diff --git a/api/core/model_runtime/model_providers/gitee_ai/rerank/__init__.py b/api/core/model_runtime/model_providers/gitee_ai/rerank/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/core/model_runtime/model_providers/gitee_ai/rerank/_position.yaml b/api/core/model_runtime/model_providers/gitee_ai/rerank/_position.yaml
new file mode 100644
index 0000000000..83162fd338
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/rerank/_position.yaml
@@ -0,0 +1 @@
+- bge-reranker-v2-m3
diff --git a/api/core/model_runtime/model_providers/gitee_ai/rerank/bge-reranker-v2-m3.yaml b/api/core/model_runtime/model_providers/gitee_ai/rerank/bge-reranker-v2-m3.yaml
new file mode 100644
index 0000000000..f0681641e1
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/rerank/bge-reranker-v2-m3.yaml
@@ -0,0 +1,4 @@
+model: bge-reranker-v2-m3
+model_type: rerank
+model_properties:
+  context_size: 1024
diff --git a/api/core/model_runtime/model_providers/gitee_ai/rerank/rerank.py b/api/core/model_runtime/model_providers/gitee_ai/rerank/rerank.py
new file mode 100644
index 0000000000..231345c2f4
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/rerank/rerank.py
@@ -0,0 +1,128 @@
+from typing import Optional
+
+import httpx
+
+from core.model_runtime.entities.common_entities import I18nObject
+from core.model_runtime.entities.model_entities import AIModelEntity, FetchFrom, ModelPropertyKey, ModelType
+from core.model_runtime.entities.rerank_entities import RerankDocument, RerankResult
+from core.model_runtime.errors.invoke import (
+    InvokeAuthorizationError,
+    InvokeBadRequestError,
+    InvokeConnectionError,
+    InvokeError,
+    InvokeRateLimitError,
+    InvokeServerUnavailableError,
+)
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.__base.rerank_model import RerankModel
+
+
+class GiteeAIRerankModel(RerankModel):
+    """
+    Rerank model that calls the Gitee AI serverless rerank HTTP endpoint.
+    """
+
+    def _invoke(
+        self,
+        model: str,
+        credentials: dict,
+        query: str,
+        docs: list[str],
+        score_threshold: Optional[float] = None,
+        top_n: Optional[int] = None,
+        user: Optional[str] = None,
+    ) -> RerankResult:
+        """
+        Rerank docs against the query with one POST to ``{base_url}/{model}/rerank``
+
+        :param model: model name, also used as the service segment of the request URL
+        :param credentials: model credentials (``api_key`` and an optional ``base_url``)
+        :param query: search query
+        :param docs: docs for reranking; an empty list returns an empty result without a request
+        :param score_threshold: when set, results scoring below it are dropped
+        :param top_n: when set, sent to the API as ``top_n``
+        :param user: unique user id (not used by this implementation)
+        :return: rerank result
+        :raises InvokeServerUnavailableError: when the API responds with an error status
+        """
+        if len(docs) == 0:
+            return RerankResult(model=model, docs=[])
+
+        endpoint = credentials.get("base_url", "https://ai.gitee.com/api/serverless").removesuffix("/")
+        payload = {"model": model, "query": query, "documents": docs}
+        if top_n is not None:
+            payload["top_n"] = top_n
+
+        try:
+            response = httpx.post(
+                f"{endpoint}/{model}/rerank",
+                json=payload,
+                headers={"Authorization": f"Bearer {credentials.get('api_key')}"},
+            )
+            response.raise_for_status()
+
+            ranked = []
+            for item in response.json()["results"]:
+                candidate = RerankDocument(
+                    index=item["index"],
+                    text=item["document"]["text"],
+                    score=item["relevance_score"],
+                )
+                # Without a threshold every result is kept; otherwise only scores at or above it.
+                if score_threshold is None or item["relevance_score"] >= score_threshold:
+                    ranked.append(candidate)
+            return RerankResult(model=model, docs=ranked)
+        except httpx.HTTPStatusError as e:
+            raise InvokeServerUnavailableError(str(e))
+
+    def validate_credentials(self, model: str, credentials: dict) -> None:
+        """
+        Validate model credentials by running one small rerank request
+
+        :param model: model name
+        :param credentials: model credentials
+        :return:
+        """
+        sample_docs = [
+            "Carson City is the capital city of the American state of Nevada. At the 2010 United States "
+            "Census, Carson City had a population of 55,274.",
+            "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that "
+            "are a political division controlled by the United States. Its capital is Saipan.",
+        ]
+        try:
+            self._invoke(
+                model=model,
+                credentials=credentials,
+                query="What is the capital of the United States?",
+                docs=sample_docs,
+                score_threshold=0.01,
+            )
+        except Exception as ex:
+            raise CredentialsValidateFailedError(str(ex))
+
+    @property
+    def _invoke_error_mapping(self) -> dict[type[InvokeError], list[type[Exception]]]:
+        """
+        Map httpx exceptions to the unified invoke error types
+        """
+        return {
+            # httpx.ConnectError and httpx.RemoteProtocolError are also httpx.RequestError subclasses.
+            # NOTE(review): presumably the caller takes the first matching entry, so keep this order.
+            InvokeConnectionError: [httpx.ConnectError],
+            InvokeServerUnavailableError: [httpx.RemoteProtocolError],
+            InvokeRateLimitError: [],
+            InvokeAuthorizationError: [httpx.HTTPStatusError],
+            InvokeBadRequestError: [httpx.RequestError],
+        }
+
+    def get_customizable_model_schema(self, model: str, credentials: dict) -> AIModelEntity:
+        """
+        Build the schema entity of a customizable rerank model from its credentials
+        """
+        return AIModelEntity(
+            model=model,
+            label=I18nObject(en_US=model),
+            model_type=ModelType.RERANK,
+            fetch_from=FetchFrom.CUSTOMIZABLE_MODEL,
+            model_properties={ModelPropertyKey.CONTEXT_SIZE: int(credentials.get("context_size"))},
+        )
diff --git a/api/core/model_runtime/model_providers/gitee_ai/speech2text/__init__.py b/api/core/model_runtime/model_providers/gitee_ai/speech2text/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/core/model_runtime/model_providers/gitee_ai/speech2text/_position.yaml b/api/core/model_runtime/model_providers/gitee_ai/speech2text/_position.yaml
new file mode 100644
index 0000000000..8e9b47598b
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/speech2text/_position.yaml
@@ -0,0 +1,2 @@
+- whisper-base
+- whisper-large
diff --git a/api/core/model_runtime/model_providers/gitee_ai/speech2text/speech2text.py b/api/core/model_runtime/model_providers/gitee_ai/speech2text/speech2text.py
new file mode 100644
index 0000000000..5597f5b43e
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/speech2text/speech2text.py
@@ -0,0 +1,53 @@
+import os
+from typing import IO, Optional
+
+import requests
+
+from core.model_runtime.errors.invoke import InvokeBadRequestError
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.__base.speech2text_model import Speech2TextModel
+from core.model_runtime.model_providers.gitee_ai._common import _CommonGiteeAI
+
+
+class GiteeAISpeech2TextModel(_CommonGiteeAI, Speech2TextModel):
+    """
+    Model class for Gitee AI speech to text model.
+    """
+
+    def _invoke(self, model: str, credentials: dict, file: IO[bytes], user: Optional[str] = None) -> str:
+        """
+        Invoke speech2text model; any non-200 response raises InvokeBadRequestError
+
+        :param model: model name, used as the service segment of the request URL
+        :param credentials: model credentials (``api_key`` is sent as a Bearer token)
+        :param file: audio file; must expose a ``name`` attribute, whose extension feeds the Content-Type header
+        :param user: unique user id (not used by this implementation)
+        :return: text for given audio file (the ``text`` field of the JSON response)
+        """
+        # doc: https://ai.gitee.com/docs/openapi/serverless#tag/serverless/POST/{service}/speech-to-text
+        # NOTE(review): os.path.splitext keeps the leading dot, so Content-Type becomes e.g. "audio/.mp3" - confirm.
+        endpoint_url = f"https://ai.gitee.com/api/serverless/{model}/speech-to-text"
+        files = [("file", file)]
+        _, file_ext = os.path.splitext(file.name)
+        headers = {"Content-Type": f"audio/{file_ext}", "Authorization": f"Bearer {credentials.get('api_key')}"}
+        response = requests.post(endpoint_url, headers=headers, files=files)
+        if response.status_code != 200:
+            raise InvokeBadRequestError(response.text)
+        response_data = response.json()
+        return response_data["text"]
+
+    def validate_credentials(self, model: str, credentials: dict) -> None:
+        """
+        Validate model credentials by transcribing the demo audio file
+
+        :param model: model name
+        :param credentials: model credentials
+        :return:
+        """
+        try:
+            audio_file_path = self._get_demo_file_path()
+            # Any failure while opening or transcribing is reported as a credentials validation error.
+            with open(audio_file_path, "rb") as audio_file:
+                self._invoke(model, credentials, audio_file)
+        except Exception as ex:
+            raise CredentialsValidateFailedError(str(ex))
diff --git a/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-base.yaml b/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-base.yaml
new file mode 100644
index 0000000000..a50bf5fc2d
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-base.yaml
@@ -0,0 +1,5 @@
+model: whisper-base
+model_type: speech2text
+model_properties:
+  file_upload_limit: 1
+  supported_file_extensions: flac,mp3,mp4,mpeg,mpga,m4a,ogg,wav,webm
diff --git a/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-large.yaml b/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-large.yaml
new file mode 100644
index 0000000000..1be7b1a391
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/speech2text/whisper-large.yaml
@@ -0,0 +1,5 @@
+model: whisper-large
+model_type: speech2text
+model_properties:
+  file_upload_limit: 1
+  supported_file_extensions: flac,mp3,mp4,mpeg,mpga,m4a,ogg,wav,webm
diff --git a/api/core/model_runtime/model_providers/gitee_ai/text_embedding/_position.yaml b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/_position.yaml
new file mode 100644
index 0000000000..e8abe6440d
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/_position.yaml
@@ -0,0 +1,3 @@
+- bge-large-zh-v1.5
+- bge-small-zh-v1.5
+- bge-m3
diff --git a/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-large-zh-v1.5.yaml b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-large-zh-v1.5.yaml
new file mode 100644
index 0000000000..9e3ca76e88
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-large-zh-v1.5.yaml
@@ -0,0 +1,8 @@
+model: bge-large-zh-v1.5
+label:
+  zh_Hans: bge-large-zh-v1.5
+  en_US: bge-large-zh-v1.5
+model_type: text-embedding
+model_properties:
+  context_size: 200000
+  max_chunks: 20
diff --git a/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-m3.yaml b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-m3.yaml
new file mode 100644
index 0000000000..a7a99a98a3
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-m3.yaml
@@ -0,0 +1,8 @@
+model: bge-m3
+label:
+  zh_Hans: bge-m3
+  en_US: bge-m3
+model_type: text-embedding
+model_properties:
+  context_size: 200000
+  max_chunks: 20
diff --git a/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-small-zh-v1.5.yaml b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-small-zh-v1.5.yaml
new file mode 100644
index 0000000000..bd760408fa
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/bge-small-zh-v1.5.yaml
@@ -0,0 +1,8 @@
+model: bge-small-zh-v1.5
+label:
+  zh_Hans: bge-small-zh-v1.5
+  en_US: bge-small-zh-v1.5
+model_type: text-embedding
+model_properties:
+  context_size: 200000
+  max_chunks: 20
diff --git a/api/core/model_runtime/model_providers/gitee_ai/text_embedding/text_embedding.py b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/text_embedding.py
new file mode 100644
index 0000000000..b833c5652c
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/text_embedding/text_embedding.py
@@ -0,0 +1,31 @@
+from typing import Optional
+
+from core.entities.embedding_type import EmbeddingInputType
+from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult
+from core.model_runtime.model_providers.openai_api_compatible.text_embedding.text_embedding import (
+    OAICompatEmbeddingModel,
+)
+
+
+class GiteeAIEmbeddingModel(OAICompatEmbeddingModel):
+    def _invoke(
+        self,
+        model: str,
+        credentials: dict,
+        texts: list[str],
+        user: Optional[str] = None,
+        input_type: EmbeddingInputType = EmbeddingInputType.DOCUMENT,
+    ) -> TextEmbeddingResult:
+        self._add_custom_parameters(credentials, model)  # point endpoint_url at this model's service
+        return super()._invoke(model, credentials, texts, user, input_type)
+
+    def validate_credentials(self, model: str, credentials: dict) -> None:
+        # NOTE(review): None selects the default "bge-m3" endpoint, so ``model`` does not affect the URL - confirm.
+        self._add_custom_parameters(credentials, None)
+        super().validate_credentials(model, credentials)
+
+    @staticmethod
+    def _add_custom_parameters(credentials: dict, model: str) -> None:
+        """Set ``credentials["endpoint_url"]`` for ``model``, falling back to "bge-m3" when it is None."""
+        service = "bge-m3" if model is None else model
+        credentials["endpoint_url"] = f"https://ai.gitee.com/api/serverless/{service}/v1/"
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/ChatTTS.yaml b/api/core/model_runtime/model_providers/gitee_ai/tts/ChatTTS.yaml
new file mode 100644
index 0000000000..940391dfab
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/ChatTTS.yaml
@@ -0,0 +1,11 @@
+model: ChatTTS
+model_type: tts
+model_properties:
+  default_voice: 'default'
+  voices:
+    - mode: 'default'
+      name: 'Default'
+      language: [ 'zh-Hans', 'en-US', 'de-DE', 'fr-FR', 'es-ES', 'it-IT', 'th-TH', 'id-ID' ]
+  word_limit: 3500
+  audio_type: 'mp3'
+  max_workers: 5
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/FunAudioLLM-CosyVoice-300M.yaml b/api/core/model_runtime/model_providers/gitee_ai/tts/FunAudioLLM-CosyVoice-300M.yaml
new file mode 100644
index 0000000000..8fc5734801
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/FunAudioLLM-CosyVoice-300M.yaml
@@ -0,0 +1,11 @@
+model: FunAudioLLM-CosyVoice-300M
+model_type: tts
+model_properties:
+  default_voice: 'default'
+  voices:
+    - mode: 'default'
+      name: 'Default'
+      language: [ 'zh-Hans', 'en-US', 'de-DE', 'fr-FR', 'es-ES', 'it-IT', 'th-TH', 'id-ID' ]
+  word_limit: 3500
+  audio_type: 'mp3'
+  max_workers: 5
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/__init__.py b/api/core/model_runtime/model_providers/gitee_ai/tts/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/_position.yaml b/api/core/model_runtime/model_providers/gitee_ai/tts/_position.yaml
new file mode 100644
index 0000000000..13c6ec8454
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/_position.yaml
@@ -0,0 +1,4 @@
+- speecht5_tts
+- ChatTTS
+- fish-speech-1.2-sft
+- FunAudioLLM-CosyVoice-300M
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/fish-speech-1.2-sft.yaml b/api/core/model_runtime/model_providers/gitee_ai/tts/fish-speech-1.2-sft.yaml
new file mode 100644
index 0000000000..93cc28bc9d
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/fish-speech-1.2-sft.yaml
@@ -0,0 +1,11 @@
+model: fish-speech-1.2-sft
+model_type: tts
+model_properties:
+  default_voice: 'default'
+  voices:
+    - mode: 'default'
+      name: 'Default'
+      language: [ 'zh-Hans', 'en-US', 'de-DE', 'fr-FR', 'es-ES', 'it-IT', 'th-TH', 'id-ID' ]
+  word_limit: 3500
+  audio_type: 'mp3'
+  max_workers: 5
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/speecht5_tts.yaml b/api/core/model_runtime/model_providers/gitee_ai/tts/speecht5_tts.yaml
new file mode 100644
index 0000000000..f9c843bd41
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/speecht5_tts.yaml
@@ -0,0 +1,11 @@
+model: speecht5_tts
+model_type: tts
+model_properties:
+  default_voice: 'default'
+  voices:
+    - mode: 'default'
+      name: 'Default'
+      language: [ 'zh-Hans', 'en-US', 'de-DE', 'fr-FR', 'es-ES', 'it-IT', 'th-TH', 'id-ID' ]
+  word_limit: 3500
+  audio_type: 'mp3'
+  max_workers: 5
diff --git a/api/core/model_runtime/model_providers/gitee_ai/tts/tts.py b/api/core/model_runtime/model_providers/gitee_ai/tts/tts.py
new file mode 100644
index 0000000000..ed2bd5b13d
--- /dev/null
+++ b/api/core/model_runtime/model_providers/gitee_ai/tts/tts.py
@@ -0,0 +1,79 @@
+from typing import Optional
+
+import requests
+
+from core.model_runtime.errors.invoke import InvokeBadRequestError
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.__base.tts_model import TTSModel
+from core.model_runtime.model_providers.gitee_ai._common import _CommonGiteeAI
+
+
+class GiteeAIText2SpeechModel(_CommonGiteeAI, TTSModel):
+    """
+    Model class for Gitee AI text to speech model.
+    """
+
+    def _invoke(
+        self, model: str, tenant_id: str, credentials: dict, content_text: str, voice: str, user: Optional[str] = None
+    ) -> any:
+        """
+        _invoke text2speech model
+
+        :param model: model name
+        :param tenant_id: user tenant id
+        :param credentials: model credentials
+        :param content_text: text content to be converted to speech
+        :param voice: model timbre
+        :param user: unique user id
+        :return: generator yielding the synthesized audio in byte chunks
+        """
+        return self._tts_invoke_streaming(model=model, credentials=credentials, content_text=content_text, voice=voice)
+
+    def validate_credentials(self, model: str, credentials: dict) -> None:
+        """
+        Validate credentials by synthesizing a short sample with the model's default voice
+
+        :param model: model name
+        :param credentials: model credentials
+        :raises CredentialsValidateFailedError: when the sample request fails
+        """
+        try:
+            audio_chunks = self._tts_invoke_streaming(
+                model=model,
+                credentials=credentials,
+                content_text="Hello Dify!",
+                voice=self._get_model_default_voice(model, credentials),
+            )
+            # _tts_invoke_streaming is a generator: nothing is sent until it is advanced.
+            next(audio_chunks, None)
+        except Exception as ex:
+            raise CredentialsValidateFailedError(str(ex)) from ex
+
+    def _tts_invoke_streaming(self, model: str, credentials: dict, content_text: str, voice: str) -> any:
+        """
+        Generator that requests the audio for the text and yields it in chunks of up to 1024 bytes
+        :param model: model name
+        :param credentials: model credentials
+        :param content_text: text content to be converted to speech
+        :param voice: model timbre (not included in the request payload)
+        :return: generator of audio byte chunks; the request is sent on first iteration
+        """
+        try:
+            # doc: https://ai.gitee.com/docs/openapi/serverless#tag/serverless/POST/{service}/text-to-speech
+            endpoint_url = "https://ai.gitee.com/api/serverless/" + model + "/text-to-speech"
+
+            headers = {"Content-Type": "application/json"}
+            api_key = credentials.get("api_key")
+            if api_key:
+                headers["Authorization"] = f"Bearer {api_key}"
+
+            payload = {"inputs": content_text}
+            response = requests.post(endpoint_url, headers=headers, json=payload)
+            if response.status_code != 200:
+                raise InvokeBadRequestError(response.text)
+
+            data = response.content
+            for i in range(0, len(data), 1024):
+                yield data[i : i + 1024]
+        except Exception as ex:
+            raise InvokeBadRequestError(str(ex)) from ex
diff --git a/api/pytest.ini b/api/pytest.ini
index dcca08e2e5..a23a4b3f3d 100644
--- a/api/pytest.ini
+++ b/api/pytest.ini
@@ -27,3 +27,4 @@ env =
     XINFERENCE_GENERATION_MODEL_UID = generate
     XINFERENCE_RERANK_MODEL_UID = rerank
     XINFERENCE_SERVER_URL = http://a.abc.com:11451
+    GITEE_AI_API_KEY = aaaaaaaaaaaaaaaaaaaa
diff --git a/api/tests/integration_tests/.env.example b/api/tests/integration_tests/.env.example
index 2d52399d29..6791cd891b 100644
--- a/api/tests/integration_tests/.env.example
+++ b/api/tests/integration_tests/.env.example
@@ -83,3 +83,6 @@ VOLC_EMBEDDING_ENDPOINT_ID=
 
 # 360 AI Credentials
 ZHINAO_API_KEY=
+
+# Gitee AI Credentials
+GITEE_AI_API_KEY=
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/__init__.py b/api/tests/integration_tests/model_runtime/gitee_ai/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_llm.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_llm.py
new file mode 100644
index 0000000000..753c52ce31
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_llm.py
@@ -0,0 +1,132 @@
+import os
+from collections.abc import Generator
+
+import pytest
+
+from core.model_runtime.entities.llm_entities import LLMResult, LLMResultChunk, LLMResultChunkDelta
+from core.model_runtime.entities.message_entities import (
+    AssistantPromptMessage,
+    PromptMessageTool,
+    SystemPromptMessage,
+    UserPromptMessage,
+)
+from core.model_runtime.entities.model_entities import AIModelEntity
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.gitee_ai.llm.llm import GiteeAILargeLanguageModel
+
+
+def test_predefined_models():
+    model = GiteeAILargeLanguageModel()
+    model_schemas = model.predefined_models()
+    # At least one predefined schema must be returned, and the first entry must be an AIModelEntity.
+    assert len(model_schemas) >= 1
+    assert isinstance(model_schemas[0], AIModelEntity)
+
+
+def test_validate_credentials_for_chat_model():
+    model = GiteeAILargeLanguageModel()
+    # An invalid API key must be rejected with CredentialsValidateFailedError.
+    with pytest.raises(CredentialsValidateFailedError):
+        # NOTE(review): "gpt-3.5-turbo" was chosen "because of mocking", but no mock fixture is requested - confirm
+        model.validate_credentials(model="gpt-3.5-turbo", credentials={"api_key": "invalid_key"})
+    # The key read from GITEE_AI_API_KEY is expected to validate without raising.
+    model.validate_credentials(
+        model="Qwen2-7B-Instruct",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+    )
+
+
+def test_invoke_chat_model():
+    model = GiteeAILargeLanguageModel()
+    # Blocking call (stream=False): the result is expected to be an LLMResult with non-empty content.
+    result = model.invoke(
+        model="Qwen2-7B-Instruct",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+        prompt_messages=[
+            SystemPromptMessage(
+                content="You are a helpful AI assistant.",
+            ),
+            UserPromptMessage(content="Hello World!"),
+        ],
+        model_parameters={
+            "temperature": 0.0,
+            "top_p": 1.0,
+            "presence_penalty": 0.0,
+            "frequency_penalty": 0.0,
+            "max_tokens": 10,
+            "stream": False,
+        },
+        stop=["How"],
+        stream=False,
+        user="foo",
+    )
+
+    assert isinstance(result, LLMResult)
+    assert len(result.message.content) > 0
+
+
+def test_invoke_stream_chat_model():
+    model = GiteeAILargeLanguageModel()
+    # Streaming call (stream=True): the result is expected to be a generator of LLMResultChunk objects.
+    result = model.invoke(
+        model="Qwen2-7B-Instruct",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+        prompt_messages=[
+            SystemPromptMessage(
+                content="You are a helpful AI assistant.",
+            ),
+            UserPromptMessage(content="Hello World!"),
+        ],
+        model_parameters={"temperature": 0.0, "max_tokens": 100, "stream": False},
+        stream=True,
+        user="foo",
+    )
+
+    assert isinstance(result, Generator)
+    # Chunks without a finish_reason must carry content; a chunk with a finish_reason must carry usage.
+    for chunk in result:
+        assert isinstance(chunk, LLMResultChunk)
+        assert isinstance(chunk.delta, LLMResultChunkDelta)
+        assert isinstance(chunk.delta.message, AssistantPromptMessage)
+        assert len(chunk.delta.message.content) > 0 if chunk.delta.finish_reason is None else True
+        if chunk.delta.finish_reason is not None:
+            assert chunk.delta.usage is not None
+
+
+def test_get_num_tokens():
+    model = GiteeAILargeLanguageModel()
+    # The expected counts (10 and 77) are fixed values; presumably tied to the parent class's token counting.
+    num_tokens = model.get_num_tokens(
+        model="Qwen2-7B-Instruct",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+        prompt_messages=[UserPromptMessage(content="Hello World!")],
+    )
+
+    assert num_tokens == 10
+    # Second case: a system message plus one tool definition are included in the count.
+    num_tokens = model.get_num_tokens(
+        model="Qwen2-7B-Instruct",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+        prompt_messages=[
+            SystemPromptMessage(
+                content="You are a helpful AI assistant.",
+            ),
+            UserPromptMessage(content="Hello World!"),
+        ],
+        tools=[
+            PromptMessageTool(
+                name="get_weather",
+                description="Determine weather in my location",
+                parameters={
+                    "type": "object",
+                    "properties": {
+                        "location": {"type": "string", "description": "The city and state e.g. San Francisco, CA"},
+                        "unit": {"type": "string", "enum": ["c", "f"]},
+                    },
+                    "required": ["location"],
+                },
+            ),
+        ],
+    )
+
+    assert num_tokens == 77
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_provider.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_provider.py
new file mode 100644
index 0000000000..f12ed54a45
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_provider.py
@@ -0,0 +1,15 @@
+import os
+
+import pytest
+
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.gitee_ai.gitee_ai import GiteeAIProvider
+
+
+def test_validate_provider_credentials():
+    provider = GiteeAIProvider()
+    # An invalid key must raise; the key read from GITEE_AI_API_KEY must validate without raising.
+    with pytest.raises(CredentialsValidateFailedError):
+        provider.validate_provider_credentials(credentials={"api_key": "invalid_key"})
+
+    provider.validate_provider_credentials(credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")})
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_rerank.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_rerank.py
new file mode 100644
index 0000000000..0e5914a61f
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_rerank.py
@@ -0,0 +1,47 @@
+import os
+
+import pytest
+
+from core.model_runtime.entities.rerank_entities import RerankResult
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.gitee_ai.rerank.rerank import GiteeAIRerankModel
+
+
+def test_validate_credentials():
+    model = GiteeAIRerankModel()
+    # An invalid API key must be rejected with CredentialsValidateFailedError.
+    with pytest.raises(CredentialsValidateFailedError):
+        model.validate_credentials(
+            model="bge-reranker-v2-m3",
+            credentials={"api_key": "invalid_key"},
+        )
+    # The key read from GITEE_AI_API_KEY is expected to validate without raising.
+    model.validate_credentials(
+        model="bge-reranker-v2-m3",
+        credentials={
+            "api_key": os.environ.get("GITEE_AI_API_KEY"),
+        },
+    )
+
+
+def test_invoke_model():
+    model = GiteeAIRerankModel()
+    result = model.invoke(
+        model="bge-reranker-v2-m3",
+        credentials={
+            "api_key": os.environ.get("GITEE_AI_API_KEY"),
+        },
+        query="What is the capital of the United States?",
+        docs=[
+            "Carson City is the capital city of the American state of Nevada. At the 2010 United States "
+            "Census, Carson City had a population of 55,274.",
+            "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean that "
+            "are a political division controlled by the United States. Its capital is Saipan.",
+        ],
+        top_n=1,
+        score_threshold=0.01,
+    )
+    # With top_n=1 exactly one document is expected back, and it must meet the 0.01 score threshold.
+    assert isinstance(result, RerankResult)
+    assert len(result.docs) == 1
+    assert result.docs[0].score >= 0.01
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_speech2text.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_speech2text.py
new file mode 100644
index 0000000000..4a01453fdd
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_speech2text.py
@@ -0,0 +1,45 @@
+import os
+
+import pytest
+
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.gitee_ai.speech2text.speech2text import GiteeAISpeech2TextModel
+
+
+def test_validate_credentials():
+    model = GiteeAISpeech2TextModel()
+    # An invalid API key must be rejected with CredentialsValidateFailedError.
+    with pytest.raises(CredentialsValidateFailedError):
+        model.validate_credentials(
+            model="whisper-base",
+            credentials={"api_key": "invalid_key"},
+        )
+    # The key read from GITEE_AI_API_KEY is expected to validate without raising.
+    model.validate_credentials(
+        model="whisper-base",
+        credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")},
+    )
+
+
+def test_invoke_model():
+    model = GiteeAISpeech2TextModel()
+
+    # Get the directory of the current file
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+
+    # Get assets directory (a sibling "assets" folder next to this test package)
+    assets_dir = os.path.join(os.path.dirname(current_dir), "assets")
+
+    # Construct the path to the audio file
+    audio_file_path = os.path.join(assets_dir, "audio.mp3")
+
+    # Open the file and get the file object
+    with open(audio_file_path, "rb") as audio_file:
+        file = audio_file
+        # The call stays inside the ``with`` block so the file is still open while it is read.
+        result = model.invoke(
+            model="whisper-base", credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")}, file=file
+        )
+        # The transcript is compared exactly against the digits one through ten.
+        assert isinstance(result, str)
+        assert result == "1 2 3 4 5 6 7 8 9 10"
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_text_embedding.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_text_embedding.py
new file mode 100644
index 0000000000..34648f0bc8
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_text_embedding.py
@@ -0,0 +1,46 @@
+import os
+
+import pytest
+
+from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.gitee_ai.text_embedding.text_embedding import GiteeAIEmbeddingModel
+
+
+def test_validate_credentials():
+    model = GiteeAIEmbeddingModel()
+    # An invalid API key must be rejected with CredentialsValidateFailedError.
+    with pytest.raises(CredentialsValidateFailedError):
+        model.validate_credentials(model="bge-large-zh-v1.5", credentials={"api_key": "invalid_key"})
+    # The key read from GITEE_AI_API_KEY is expected to validate without raising.
+    model.validate_credentials(model="bge-large-zh-v1.5", credentials={"api_key": os.environ.get("GITEE_AI_API_KEY")})
+
+
+def test_invoke_model():
+    model = GiteeAIEmbeddingModel()
+    # Two input texts are embedded; one embedding per text is expected back.
+    result = model.invoke(
+        model="bge-large-zh-v1.5",
+        credentials={
+            "api_key": os.environ.get("GITEE_AI_API_KEY"),
+        },
+        texts=["hello", "world"],
+        user="user",
+    )
+
+    assert isinstance(result, TextEmbeddingResult)
+    assert len(result.embeddings) == 2
+
+
+def test_get_num_tokens():
+    model = GiteeAIEmbeddingModel()
+    # The two single-word texts are expected to total exactly 2 tokens.
+    num_tokens = model.get_num_tokens(
+        model="bge-large-zh-v1.5",
+        credentials={
+            "api_key": os.environ.get("GITEE_AI_API_KEY"),
+        },
+        texts=["hello", "world"],
+    )
+
+    assert num_tokens == 2
diff --git a/api/tests/integration_tests/model_runtime/gitee_ai/test_tts.py b/api/tests/integration_tests/model_runtime/gitee_ai/test_tts.py
new file mode 100644
index 0000000000..9f18161a7b
--- /dev/null
+++ b/api/tests/integration_tests/model_runtime/gitee_ai/test_tts.py
@@ -0,0 +1,23 @@
+import os
+
+from core.model_runtime.model_providers.gitee_ai.tts.tts import GiteeAIText2SpeechModel
+
+
+def test_invoke_model():
+    """Invoke text-to-speech on a short phrase and expect non-empty streamed output."""
+    credentials = {"api_key": os.environ.get("GITEE_AI_API_KEY")}
+    tts_model = GiteeAIText2SpeechModel()
+
+    streamed_chunks = tts_model.invoke(
+        model="speecht5_tts",
+        tenant_id="test",
+        credentials=credentials,
+        content_text="Hello, world!",
+        voice="",
+    )
+
+    # Drain the returned iterable and concatenate its chunks.
+    payload = b"".join(streamed_chunks)
+
+    # At least one non-empty chunk must have been produced.
+    assert payload != b""

From ddb960ddfbd47bfa58fbdb92f6d781c55a3978d3 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=9D=9E=E6=B3=95=E6=93=8D=E4=BD=9C?= <hjlarry@163.com>
Date: Mon, 28 Oct 2024 16:52:57 +0800
Subject: [PATCH 03/29] feat: support Vectorizer can be used in workflow
 (#9932)

---
 api/core/agent/base_agent_runner.py           | 12 +++++
 api/core/file/file_manager.py                 | 12 ++++-
 .../builtin/vectorizer/tools/test_data.py     |  1 -
 .../builtin/vectorizer/tools/vectorizer.py    | 53 ++++++++++++-------
 .../builtin/vectorizer/tools/vectorizer.yaml  | 15 +++---
 .../provider/builtin/vectorizer/vectorizer.py | 10 +++-
 .../builtin/vectorizer/vectorizer.yaml        |  8 ---
 api/core/tools/tool_manager.py                | 14 +++--
 8 files changed, 82 insertions(+), 43 deletions(-)
 delete mode 100644 api/core/tools/provider/builtin/vectorizer/tools/test_data.py

diff --git a/api/core/agent/base_agent_runner.py b/api/core/agent/base_agent_runner.py
index 514dcfbd68..507455c176 100644
--- a/api/core/agent/base_agent_runner.py
+++ b/api/core/agent/base_agent_runner.py
@@ -165,6 +165,12 @@ class BaseAgentRunner(AppRunner):
                 continue
 
             parameter_type = parameter.type.as_normal_type()
+            if parameter.type in {
+                ToolParameter.ToolParameterType.SYSTEM_FILES,
+                ToolParameter.ToolParameterType.FILE,
+                ToolParameter.ToolParameterType.FILES,
+            }:
+                continue
             enum = []
             if parameter.type == ToolParameter.ToolParameterType.SELECT:
                 enum = [option.value for option in parameter.options]
@@ -250,6 +256,12 @@ class BaseAgentRunner(AppRunner):
                 continue
 
             parameter_type = parameter.type.as_normal_type()
+            if parameter.type in {
+                ToolParameter.ToolParameterType.SYSTEM_FILES,
+                ToolParameter.ToolParameterType.FILE,
+                ToolParameter.ToolParameterType.FILES,
+            }:
+                continue
             enum = []
             if parameter.type == ToolParameter.ToolParameterType.SELECT:
                 enum = [option.value for option in parameter.options]
diff --git a/api/core/file/file_manager.py b/api/core/file/file_manager.py
index 0c6ce8ce75..b69d7a74c0 100644
--- a/api/core/file/file_manager.py
+++ b/api/core/file/file_manager.py
@@ -76,8 +76,16 @@ def to_prompt_message_content(f: File, /):
 
 
 def download(f: File, /):
-    upload_file = file_repository.get_upload_file(session=db.session(), file=f)
-    return _download_file_content(upload_file.key)
+    """Return the content of ``f``, selecting the source by its transfer method."""
+    if f.transfer_method == FileTransferMethod.TOOL_FILE:
+        record = file_repository.get_tool_file(session=db.session(), file=f)
+        return _download_file_content(record.file_key)
+    if f.transfer_method == FileTransferMethod.LOCAL_FILE:
+        record = file_repository.get_upload_file(session=db.session(), file=f)
+        return _download_file_content(record.key)
+    remote = ssrf_proxy.get(f.remote_url, follow_redirects=True)  # any other method: fetch by URL
+    remote.raise_for_status()
+    return remote.content
 
 
 def _download_file_content(path: str, /):
diff --git a/api/core/tools/provider/builtin/vectorizer/tools/test_data.py b/api/core/tools/provider/builtin/vectorizer/tools/test_data.py
deleted file mode 100644
index 8effa9818a..0000000000
--- a/api/core/tools/provider/builtin/vectorizer/tools/test_data.py
+++ /dev/null
@@ -1 +0,0 @@
-VECTORIZER_ICON_PNG = "iVBORw0KGgoAAAANSUhEUgAAAGAAAABgCAYAAADimHc4AAAACXBIWXMAACxLAAAsSwGlPZapAAAAAXNSR0IArs4c6QAAAARnQU1BAACxjwv8YQUAAAboSURBVHgB7Z09bBxFFMffRoAvcQqbguBUxu4wCUikMCZ0TmQK4NLQJCJOlQIkokgEGhQ7NCFIKEhQuIqNnIaGMxRY2GVwmlggDHS+pIHELmIXMTEULPP3eeXz7e7szO7MvE1ufpKV03nuNn7/mfcxH7tEHo/H42lXgqwG1bGw65+/aTQM6K0gpJdCoi7ypCIMui5s9Qv9R1OVTqrVxoL1jPbpvH4hrIp/rnmj5+YOhTQ++1kwmdZgT9ovRi6EF4Xhv/XGL0Sv6OLXYMu0BokjYOSDcBQfJI8xhKFP/HAlqCW8v5vqubBr8yn6maCexxiIDR376LnWmBBzQZtPEvx+L3mMAleOZKb1/XgM2EOnyWMFZJKt78UEQKpJHisk2TYmgM967JFk2z3kYcULwIwXgBkvADNeAGa8AMw8Qcwc6N55/eAh0cYmGaOzQtR/kOhQX+M6+/c23r+3RlT/i2ipTrSyRqw4F+CwMMbgANHQwG7jRywLw/wqDDNzI79xYPjqa2L262jjtYzaT0QT3xEbsck4MXUakgWOvUx08liy0ZPYEKNhel4Y6AZpgR7/8Tvq1wEQ+sMJN6Nh9kqwy+bWYwAM8elZovNv6xmlU7iLs280RNO9ls51os/h/8eBVQEig8Dt5OXUsNrno2tluZw0cI3qUXKONQHy9sYkVHqnjntLA2LnFTAv1gSA+zBhfIDvkfVO/B4xRgWZn4fbe2WAnGJFAAxn03+I7PtUXdzE90Sjl4ne+6L4d5nCigAyYyHPn7tFdPN30uJwX/qI6jtISkQZFVLdhd9SrtNPTrFSB6QZBAaYntsptpAyfvk+KYOCamVR/XrNtLqepduiFnkh3g4iIw6YLAhlOJmKwB9zaarhApr/MPREjAZVisSU1s/KYsGzhmKXClYEWLm/8xpV7btXhcv5I7lt2vtJFA3q/T07r1HopdG5l5xhxQVdn28YFn8kBJCBOZmiPHio1m5QuJzlu9ntXApgZwSsNYJslvGjtjrfm8Sq4neceFUtz3dZCzwW09Gqo2hreuPN7HZRnNqa1BP1x8lhczVNK+zT0TqkjYAF4e7Okxoo2PZX5K4IrhNpb/P8FTK2S1+TcUq1HpBFmquJYo1qEYU6RVarJE0c2ooL7C5IRwBZ5nJ9joyRtk5hA3YBdHqWzG1gBKgE/bzMaK5LqMIugKrbUDHu59/YWVRBsWhrsYZdANV5HBUXYGNlC9dFBW8LdgH6FQVYUnQvkQgm3NH8YuO7bM4LsWZBfT3qRY9OxRyJgJRz+Ij+FDPEQ1C3GVMiWAVQ7f31u/ncytxi4wdZTbRGgdcHnpYLD/FcwSrAoOKizfKfVAiIF4kBMPK+Opfe1iWsMUB1BJh2BRgBabSNAOiFqkXYbcNFUF9P+u82FGdWTcEmgGrvh0FUppB1kC073muXEaDq/21kIjLxV9tFAC7/n5X6tkUM0PH/dcP+P0v41fvkFBYBVHs/MD0CDmVsOzEdb7JgEYDT/8uq4rpj44NSjwDTc/CyzV1gxbH7Ac4F0PH/S4ZHAOaFZLiY+2nFuQA6/t9kQMTCz1CG66tbWvWS4VwAVf9vugAbel6efqrsYbKBcwFeVNz8ajobyTppw2F84FQAnfl/kwER6wJZcWdBc7e2KZwKoOP/TVakWb0f7md+kVhwOwI0BDCFyq42rt4PSiuAiRGAEXdK4ZQlV+8HTgVwefwHvR7nhbOA0FwBGDgTIM/Z3SLXUj2hOW1wR10eSrs7Ou9eTB3jo/dzuh/gTABdn35c8dhpM3BxOmeTuXs/cDoCdDY4qe7l32pbaZxL1jF+GXo/cLotBcWVTiZU3T7RMn8rHiijW9FgauP4Ef1TLdhHWgac
CgAj6tYCqGKjU/DNbqxIkMYZNs7MpxmnLuhmwYJna1dbdzHjY42hDL4/wqkA6HWuDkAngRH0iYVjRkVwnoZO/0gsuLwpkw7OBcAtwlwvfESHxctmfMBSiOG0oStj4HCF7T3+RWARwIU7QK/HbWlqls52mYJtezqMj3v34C5VOveFy8Ll4QoTsJ8Txp0RsW8/Os2im2LCtSC1RIqLw3RldTVplOKkPEYDhMAPqttnune2rzTv5Y+WKdEem2ixkWqZYSeDSUp3qwIYNOrR7cBjcbOORxkvADNeAGa8AMx4AZjxAjATf5Ab0Tp5rJBk2/iD3PAwYo8Vkmyb9CjDGfLYIaCp1rdiAnT8S5PeDVkgoDuVCsWeJxwToHZ163m3Z8hjloDGk54vn5gFbT/5eZw8phifvZz8XPlA9qmRj8JRCumi+OkljzbbrvxM0qPMm9rIqY6FXZubVBUinMbzcP3jbuXA6Mh2kMx07KPJJLfj8Xg8Hg/4H+KfFYb2WM4MAAAAAElFTkSuQmCC"  # noqa: E501
diff --git a/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.py b/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.py
index 4bd601c0bd..c722cd36c8 100644
--- a/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.py
+++ b/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.py
@@ -1,11 +1,12 @@
-from base64 import b64decode
 from typing import Any, Union
 
 from httpx import post
 
+from core.file.enums import FileType
+from core.file.file_manager import download
+from core.tools.entities.common_entities import I18nObject
 from core.tools.entities.tool_entities import ToolInvokeMessage, ToolParameter
-from core.tools.errors import ToolProviderCredentialValidationError
-from core.tools.provider.builtin.vectorizer.tools.test_data import VECTORIZER_ICON_PNG
+from core.tools.errors import ToolParameterValidationError
 from core.tools.tool.builtin_tool import BuiltinTool
 
 
@@ -16,30 +17,30 @@ class VectorizerTool(BuiltinTool):
         """
         invoke tools
         """
-        api_key_name = self.runtime.credentials.get("api_key_name", None)
-        api_key_value = self.runtime.credentials.get("api_key_value", None)
+        api_key_name = self.runtime.credentials.get("api_key_name")
+        api_key_value = self.runtime.credentials.get("api_key_value")
         mode = tool_parameters.get("mode", "test")
-        if mode == "production":
-            mode = "preview"
-
-        if not api_key_name or not api_key_value:
-            raise ToolProviderCredentialValidationError("Please input api key name and value")
 
+        # image file for workflow mode
+        image = tool_parameters.get("image")
+        if image and image.type != FileType.IMAGE:
+            raise ToolParameterValidationError("Not a valid image")
+        # image_id for agent mode
         image_id = tool_parameters.get("image_id", "")
-        if not image_id:
-            return self.create_text_message("Please input image id")
 
-        if image_id.startswith("__test_"):
-            image_binary = b64decode(VECTORIZER_ICON_PNG)
-        else:
+        if image_id:
             image_binary = self.get_variable_file(self.VariableKey.IMAGE)
             if not image_binary:
                 return self.create_text_message("Image not found, please request user to generate image firstly.")
+        elif image:
+            image_binary = download(image)
+        else:
+            raise ToolParameterValidationError("Please provide either image or image_id")
 
         response = post(
             "https://vectorizer.ai/api/v1/vectorize",
+            data={"mode": mode},
             files={"image": image_binary},
-            data={"mode": mode} if mode == "test" else {},
             auth=(api_key_name, api_key_value),
             timeout=30,
         )
@@ -59,11 +60,23 @@ class VectorizerTool(BuiltinTool):
         return [
             ToolParameter.get_simple_instance(
                 name="image_id",
-                llm_description=f"the image id that you want to vectorize, \
-                    and the image id should be specified in \
+                llm_description=f"the image_id that you want to vectorize, \
+                    and the image_id should be specified in \
                         {[i.name for i in self.list_default_image_variables()]}",
                 type=ToolParameter.ToolParameterType.SELECT,
-                required=True,
+                required=False,
                 options=[i.name for i in self.list_default_image_variables()],
-            )
+            ),
+            ToolParameter(
+                name="image",
+                label=I18nObject(en_US="image", zh_Hans="image"),
+                human_description=I18nObject(
+                    en_US="The image to be converted.",
+                    zh_Hans="要转换的图片。",
+                ),
+                type=ToolParameter.ToolParameterType.FILE,
+                form=ToolParameter.ToolParameterForm.LLM,
+                llm_description="you should not input this parameter. just input the image_id.",
+                required=False,
+            ),
         ]
diff --git a/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.yaml b/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.yaml
index 4b4fb9e245..0afd1c201f 100644
--- a/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.yaml
+++ b/api/core/tools/provider/builtin/vectorizer/tools/vectorizer.yaml
@@ -4,14 +4,21 @@ identity:
   label:
     en_US: Vectorizer.AI
     zh_Hans: Vectorizer.AI
-    pt_BR: Vectorizer.AI
 description:
   human:
     en_US: Convert your PNG and JPG images to SVG vectors quickly and easily. Fully automatically. Using AI.
     zh_Hans: 一个将 PNG 和 JPG 图像快速轻松地转换为 SVG 矢量图的工具。
-    pt_BR: Convert your PNG and JPG images to SVG vectors quickly and easily. Fully automatically. Using AI.
   llm: A tool for converting images to SVG vectors. you should input the image id as the input of this tool. the image id can be got from parameters.
 parameters:
+  - name: image
+    type: file
+    label:
+      en_US: image
+    human_description:
+      en_US: The image to be converted.
+      zh_Hans: 要转换的图片。
+    llm_description: you should not input this parameter. just input the image_id.
+    form: llm
   - name: mode
     type: select
     required: true
@@ -20,19 +27,15 @@ parameters:
         label:
           en_US: production
           zh_Hans: 生产模式
-          pt_BR: production
       - value: test
         label:
           en_US: test
           zh_Hans: 测试模式
-          pt_BR: test
     default: test
     label:
       en_US: Mode
       zh_Hans: 模式
-      pt_BR: Mode
     human_description:
       en_US: It is free to integrate with and test out the API in test mode, no subscription required.
       zh_Hans: 在测试模式下，可以免费测试API。
-      pt_BR: It is free to integrate with and test out the API in test mode, no subscription required.
     form: form
diff --git a/api/core/tools/provider/builtin/vectorizer/vectorizer.py b/api/core/tools/provider/builtin/vectorizer/vectorizer.py
index 3b868572f9..8140348723 100644
--- a/api/core/tools/provider/builtin/vectorizer/vectorizer.py
+++ b/api/core/tools/provider/builtin/vectorizer/vectorizer.py
@@ -1,5 +1,7 @@
 from typing import Any
 
+from core.file import File
+from core.file.enums import FileTransferMethod, FileType
 from core.tools.errors import ToolProviderCredentialValidationError
 from core.tools.provider.builtin.vectorizer.tools.vectorizer import VectorizerTool
 from core.tools.provider.builtin_tool_provider import BuiltinToolProviderController
@@ -7,6 +9,12 @@ from core.tools.provider.builtin_tool_provider import BuiltinToolProviderControl
 
 class VectorizerProvider(BuiltinToolProviderController):
     def _validate_credentials(self, credentials: dict[str, Any]) -> None:
+        test_img = File(
+            tenant_id="__test_123",
+            remote_url="https://cloud.dify.ai/logo/logo-site.png",
+            type=FileType.IMAGE,
+            transfer_method=FileTransferMethod.REMOTE_URL,
+        )
         try:
             VectorizerTool().fork_tool_runtime(
                 runtime={
@@ -14,7 +22,7 @@ class VectorizerProvider(BuiltinToolProviderController):
                 }
             ).invoke(
                 user_id="",
-                tool_parameters={"mode": "test", "image_id": "__test_123"},
+                tool_parameters={"mode": "test", "image": test_img},
             )
         except Exception as e:
             raise ToolProviderCredentialValidationError(str(e))
diff --git a/api/core/tools/provider/builtin/vectorizer/vectorizer.yaml b/api/core/tools/provider/builtin/vectorizer/vectorizer.yaml
index 1257f8d285..94dae20876 100644
--- a/api/core/tools/provider/builtin/vectorizer/vectorizer.yaml
+++ b/api/core/tools/provider/builtin/vectorizer/vectorizer.yaml
@@ -4,11 +4,9 @@ identity:
   label:
     en_US: Vectorizer.AI
     zh_Hans: Vectorizer.AI
-    pt_BR: Vectorizer.AI
   description:
     en_US: Convert your PNG and JPG images to SVG vectors quickly and easily. Fully automatically. Using AI.
     zh_Hans: 一个将 PNG 和 JPG 图像快速轻松地转换为 SVG 矢量图的工具。
-    pt_BR: Convert your PNG and JPG images to SVG vectors quickly and easily. Fully automatically. Using AI.
   icon: icon.png
   tags:
     - productivity
@@ -20,15 +18,12 @@ credentials_for_provider:
     label:
       en_US: Vectorizer.AI API Key name
       zh_Hans: Vectorizer.AI API Key name
-      pt_BR: Vectorizer.AI API Key name
     placeholder:
       en_US: Please input your Vectorizer.AI ApiKey name
       zh_Hans: 请输入你的 Vectorizer.AI ApiKey name
-      pt_BR: Please input your Vectorizer.AI ApiKey name
     help:
       en_US: Get your Vectorizer.AI API Key from Vectorizer.AI.
       zh_Hans: 从 Vectorizer.AI 获取您的 Vectorizer.AI API Key。
-      pt_BR: Get your Vectorizer.AI API Key from Vectorizer.AI.
     url: https://vectorizer.ai/api
   api_key_value:
     type: secret-input
@@ -36,12 +31,9 @@ credentials_for_provider:
     label:
       en_US: Vectorizer.AI API Key
       zh_Hans: Vectorizer.AI API Key
-      pt_BR: Vectorizer.AI API Key
     placeholder:
       en_US: Please input your Vectorizer.AI ApiKey
       zh_Hans: 请输入你的 Vectorizer.AI ApiKey
-      pt_BR: Please input your Vectorizer.AI ApiKey
     help:
       en_US: Get your Vectorizer.AI API Key from Vectorizer.AI.
       zh_Hans: 从 Vectorizer.AI 获取您的 Vectorizer.AI API Key。
-      pt_BR: Get your Vectorizer.AI API Key from Vectorizer.AI.
diff --git a/api/core/tools/tool_manager.py b/api/core/tools/tool_manager.py
index 9e984732b7..63f7775164 100644
--- a/api/core/tools/tool_manager.py
+++ b/api/core/tools/tool_manager.py
@@ -242,11 +242,15 @@ class ToolManager:
         parameters = tool_entity.get_all_runtime_parameters()
         for parameter in parameters:
             # check file types
-            if parameter.type in {
-                ToolParameter.ToolParameterType.SYSTEM_FILES,
-                ToolParameter.ToolParameterType.FILE,
-                ToolParameter.ToolParameterType.FILES,
-            }:
+            if (
+                parameter.type
+                in {
+                    ToolParameter.ToolParameterType.SYSTEM_FILES,
+                    ToolParameter.ToolParameterType.FILE,
+                    ToolParameter.ToolParameterType.FILES,
+                }
+                and parameter.required
+            ):
                 raise ValueError(f"file type parameter {parameter.name} not supported in agent")
 
             if parameter.form == ToolParameter.ToolParameterForm.FORM:

From 7056009b6adb60071b04d1441605cd0e886eb5e0 Mon Sep 17 00:00:00 2001
From: Xiao Ley <xiao.ley@outlook.com>
Date: Mon, 28 Oct 2024 17:18:28 +0800
Subject: [PATCH 04/29] feat(tools): add Baidu translation tool (#9943)

---
 .../builtin/baidu_translate/_assets/icon.png  | Bin 0 -> 16676 bytes
 .../_baidu_translate_tool_base.py             |  11 +
 .../baidu_translate/baidu_translate.py        |  17 ++
 .../baidu_translate/baidu_translate.yaml      |  39 +++
 .../baidu_translate/tools/fieldtranslate.py   |  78 +++++
 .../baidu_translate/tools/fieldtranslate.yaml | 123 ++++++++
 .../builtin/baidu_translate/tools/language.py |  95 ++++++
 .../baidu_translate/tools/language.yaml       |  43 +++
 .../baidu_translate/tools/translate.py        |  67 +++++
 .../baidu_translate/tools/translate.yaml      | 275 ++++++++++++++++++
 10 files changed, 748 insertions(+)
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/_assets/icon.png
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/_baidu_translate_tool_base.py
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/baidu_translate.py
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/baidu_translate.yaml
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.py
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.yaml
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/language.py
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/language.yaml
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/translate.py
 create mode 100644 api/core/tools/provider/builtin/baidu_translate/tools/translate.yaml

diff --git a/api/core/tools/provider/builtin/baidu_translate/_assets/icon.png b/api/core/tools/provider/builtin/baidu_translate/_assets/icon.png
new file mode 100644
index 0000000000000000000000000000000000000000..8eb8f21513ba7d45de8204bfe64aa3cc1fd7fc26
GIT binary patch
literal 16676
zcmeIYWl)^W7A-ssPH+qEu7kTf1a}BBz~JugFj#Ph;O>$HCpZKN4k1Wzhu}_f$$PxM
z`{z`B_urYSd8B*qwR^8#-80WqJ6cUe4h@9}1pok`DacD}yqtwzzM@D7FUPcf^Oqxi
zpRbmly9U^c!r9fy(#9S_;qK!Mp@4YXSONgv-)nPiTxr_k!+&4my1|`}xwK|apzYpW
z3Q%*=&d)4Z{?zu!(8{VrN(PXe0*c0eef}-78+13XaYk3B;WoB(!Tjl)|6Y!5zRB~i
z1N+XPH4|{>nwyvjANcdyStst*m%VzP&!WErR|DA2{15yyx{WHnE)s9;5wmvJnFO^Z
z2Gzb{p1D2pD7<M`JDVgv^$7W8KenqgcFP*Kh<@Yuczyq4KS3{u?Xl(aYZWKjQ=HBp
zz3^lCl%4pPS3%r`M`*vU3NLzZZ-4nbdsvc;<bVA#%2_{8^c>KQo^JPz9N(9C^SN5z
z@5<omxoB7SGVjdlGO+t`u)R{Op4j-#Chh6|VR+H#VdwhHILZF{<m>&>S21IgB`EoF
zjmhu)<|+ZN+2f+&IEM>6&7ZX^Kkq1hk@P<|j{ofY9sP6cdG*c+4GcPe4=E>o%BvGd
zXp4_^Y&(r#zCChJp_Tm{uu*+G3w<;|8{`v%rQDR9bMo>>X01`<c<v0u4*Oj*xcd0X
zuj7D;&p2MycX%*&W$<nOJ^RzIqlmBS$NW}DN4cTLM|egoQt7k#{wQIsmp8@k7<bQ)
zizZEWJ)s9=Zji9m_&sduwhX5)34J{7>tWILs#EPv#;@0-TD{CT*i2z^jO5vb3_IDs
zy2Rr>y0d9T^NWE(l)kX*9GD{!ZejYa<m5A+1}@P5?nJ!<N8!3MWR^w5*HR%x|4!9A
zFU*sSVJyv6tg0-{lZqGE$yLISxxrRssod63WUaj-vaPAyHL&IRIKSrqs=(g1EltPJ
zuFGxqYnqVQ>b>~S{shpbJaq!+p>?t9iq%k-WgbL_Yx#Jrz5$S%rmOGqalU1_btYcu
zq;ssU<0R1eBaVvj!M3J~$jMd0d~O?fFYxjCXYKBq&gG)UgXz8AJ95^Y0AzZ8g(gD$
z%W3dA)vNU>W8UWZ!Ton{=yR5Kqhq%9A;~W3DT58BD__gEL_a+?tzdLy5&Wj^xNq5s
zdvp7vAvfvZms#77lN-cp*3w#=ur_=Rf<rY2il@7ty4A(H<GaU2QC($H?=SRF^##I0
zXZjSYT>=N;w^TRA#q=6xUXHa!0c*`aHB^SQeZSd}2)Xjdmu{!+ZI(T>IY*x79DNYL
zsb;m>Zo1uo(-|13iM!&xCS4qDcd>KhUr(^Rj$j=6Lh^QXEUszN_T<CH;Yy<jIZ=F=
zUSg`&F`VcYoBe@3pDQtmsSx8j3?rV2E3g<!=wN;mXi7c^Q$V>GIFswQ*E)QVHEZpV
z&$(zTq+;T^oz@n{e(ZbF3y%>vXQl5m5GXrpHIBnSkj|ons>f`qF8UoK$E3eyqD<+Q
z`b2c7H_`3n(;3uKc#S&cuJ?o&9R503?fN*al?mF6Q^(if)q^D^H0ZEWTe><z47;~J
z63ca+8t8iNgZ?(6_?C50GTE@p`EhnJy8mP9_lox=AA3aKbXs+_Y)F!@xAZo1Nk=?}
zi_Gx6Z6D^2>fK)kO8E7vBM&0Ty0+3nk-PXC&F8XacjHueT;gnWU#E}|(~q2^Dw(AO
zS)3Zs?cwiM)NZjBkACtq`>-S6suGR~gIl$<66sOiWkJns-m1-~HTno!J6hQk8Ss>B
zcgX3<jC6~@<eU~(c!p!;K1nHWF-BWsfLvO{KN}&d=Z4<F=a?tkPm~MH5=>J-D%06)
zU_IU%1#PhCQ`d@z?{QcK08heOe-YRP-P`6l4Xx|BXuW?!E4YBZa<@KS-m&1dFYcef
z+_Vb925rp<CJq|ew<g)*R{1%KLWdE|QYU$yjbXUvsm#v>HoIao0S>`YKUvwubT`(I
zEC|anpDVjbT<6{&Ka*Vy$a>who$R<NpRIUcWw(wre#MphkmIJpc8@aRFx&e?n|pRA
zC<JJQUn99W77sud#rO9K`3%_VbaoTI8Dc~%TN1!PM9KtNMjo>8nXfp6PP^ft`8@LW
zV499#y)zp4dO$^8B1xB3KF5ue|Li;5xrWk8bpRNyYjx;7fyaRs`?0tszrQr6p&|pt
zz+D|SVmVaj03wJ(G~F9F`dP=f;8xa69acD#Yd$2?dgplH9fLL!7-61B^9PD7${Y&_
zM0VJb0R6j*(Z4(DDf6Po`<}vfWZ>}P!xk@t4BknXpA@c#8+(xY9j};M_>aZB{XW7}
zSjNTlMnP`W9Zrg5uMyeuVqLsepe@QLI@sW6i^b*kLZHs{g^NUfK93o$TU5342$ahs
zZj1lt9;xWXNi7!!g|qkyI$L@&e;*v@ywn`4P!VJ75jx-3Gg{yS?04i%*R0_D=AGS(
zESBt6lTOb@uOAiTqa6--l9muR=bU$G;>Urnzb|}?hHKxDC&2@mkXTDUNC~H*<EP9&
z<Yu}nvk>y@xuz;Wp#B&XNgJ0(hS9G<#J0i|c!FA|kyxG7j=D>V@JlUmd9v~>&Ix+d
z2`-;Aoor!BZz!Sbp&X=9n8#*bi?>w+)?@v02Z`+ggGFTIR{*9)2Yd8S8FZjmnwe=v
zUxmCl(Fh_mFR*uMP-FX(OTFX>UeOfvd844mXnCx?IrWjH?;~kF$@cHKia;#cQKEg_
zKppDg42+d$dK=kF5iB6E{{@cD%;-z2&N^1tYt^`QQkoc|4__!#wyw6{2}BxR3Wxx9
z#>%?`cy5VZfhxEPn%xpe0FxPb3J&JN&#(==AR2pw#rMu}ux?c7Qbe(HG|XtTf+Q*L
zn|>k)99!IdGNZx?Q4im^W=LinIBb`L1i|BHc-lHo4V)-OR%VCv<nV7)p7xxpxf3Ew
zx2q=EBPK>JJi{2YT{C(c4zbiom-YBc1E<o=xH`PVXVWS9p>sV*;s`hJmEvm~9<j4w
z_sVjfq&y`?*gj$&h#%g=%~riN-B^l}>p_&FhoEKhci#3ui3BpXoA?Flq@;KD0eew|
zB&O)T`3M|<FyS>vS@IJBFSf~r?#<jNJ?B#x1M$Adv+mwJDWd|VXdlcam^Jiwd+QUs
z-YAUt-Pl4&5mPrp$(>G)lcmP#tpYm1uIFyhvypJ*)@`abe_#2@o5+<ZM@|yN_<Syl
zY~h}X(crlTxhXX0AQmF?T3&dee~3Q#t)jDI$j@S887?dR;j5!QqVe6gl|LTT5=$xF
zNFC(^duBuYu{H-I2G8}mmzSi)SV$xDmc(AWrDP5zK9xXml$#u};>Fg*t%E|Oj964}
z?eTjNB+In#8FRVU@s?k0V%rQgVPp44;(rVobn)+7*2%^Bst|9oxrdauvSmz5sFObe
zYydV2hNz<H5o{V@aXA|qM+7WOk|YXHcGQ4c1`m1!Oy%)z1PwViF_c)CL|kB0{iwEv
z;FZ)Y=5~&nWZJ9Rb7bwMypzP*Q25SDj#>S;L@{x_Z7_rE4Wonn?8C0|aQHUs4I%v7
z*6{Lx6(b@xumr;7XbN9MN}z^|=J$PSOHRG;NK=st6mP_|oC*R*<Z?zV%Y|!FiQ#FO
z{8sAB6UF{q#~wE<`H^553mSJ)1SI0g_bmRg^vc9tO$eEr_{4CqND~Fkd#U`?Pm1yH
zfv6pBl&MrG_}L92HMo6f)Sf-NbUTV)wsXE;e^FD<b$-)y&Jnout|RPK-tA+L8WP!i
zG~-ZHwuNZ3d`7bP85v}Q9hijDbceR&n$d%47VKB3H0zXa<L|Jy>NnncM!{ma%ESPp
z)YhP^5huQ33-!~rcLZ#8G3m)qG|@fG8{+`R%u)5@w_O?Ry)uTB3yYGH=DMxRG*k(L
zhTj<HbV)c7CE>gg@Pp}F+EA8*>k#9T{DV*FXQCugWtK%S4F^k>LmE?FJI}RkQ<CM8
zvf70oR?@^G^_2z7G!WvXe5pOO5|`T5;*%JR2ca$fq?p!^#w|(J;^K!BhRGh24cSGO
zfWsKPmT&#`z3Ba+7G3yYp_X7L)=JE}OlXx$Rv;s^jnODv#$B8;<mcO=rlEcPCFrDs
zDHdtAqjSl#JlR@hE2EbLFRK*l^_t-RD<yJ<UkcyIn;20Cwmdz04AflGafg-9s9OQi
zaIg?HvO;d6qX|pF%CDM*atwB;kyKO-Q~o8jI`Sk+oN>}&u2kOq?I=jj>>yV8F&KjN
zsHKyFwy62=0m8Lzh)o&`t*-!q4onTXjd|KDTot{!O3dDO)%*Hnck0OcbB2$Uq}mq=
z_2LXe%h<gPH$(aZtFWV0T8SjnD9Xev@H}hg)?=)&j<jQ&{07)?#FNJY2e!E)0x^E;
zIOhgsm1m%6WDP{u6yjb)baq}Z)QiW8P7tM*Ch;3kr5z~w=icyuxVm9UNUkV-+?yHR
z;)^UEK{IjGRS9t<>9lO5V|A+JI}M~9s`BOs78}6Ox?1)(aIkUts<fdd&oLz$6>j+z
zk~wSnLvZ>ggHkOSInX~h5dnCp`QE1=DfOyMNO?xPaEAh`1YJXwl2)iQwWI|RtM)-F
zUR__|1l7rfmKcD(G!^3;i&?N1g{0O(D7LC5D9%(&D<MD4ow_l)&vpeMA-j>!c7g96
z-+*U;OQr8^!NO~x1z<ay%P{gaU{5zR*$xnhnnqx|Y}GtOH)FT402ff&;Op4muEUq8
zF_=ZndzDxp5jLD#5Sfg~fc*JgPVP`{`<JJlKZeDOh7ktQub+{5Hd|h^B6w4`eNuq@
zjFh5xh$R=1Cpw{*s>-!fh(H9PJYYPk`Fd?SfSQIpfPn!n0fv`pH6XaC;PgzU262s6
zNgxgf5Dr!~a&|7-yRS=KPzdis_^h_R0w-0Lp`o((>NZOfYrXg7NHbvZquJifNBtEk
zTQf;ata3#`ihzuUu5A3@iMdqcXFf;@-;m<EwHS`sVj&++zVUKXO4z_KV#`j5jHo~2
z>{+5R+{qa*X?^6ub3|!#Gx>3vG>%FbY*c)TwUrxY>n<n1$TALNz{Ofg=#e~S!INwx
zkWc|4-{#>YEBPR;5{3GE=_-UN;h{?$NUTtq^yGK#HWcs(X{;<S9o^ZXiz-9Z%W>?~
z>YlBHd1L6orOgxkY`#F7qa#qv)Sx}zcb*6kH*qt{b>mCJqFwq9e-&Q*QAu@U&iRHv
zfF}dm%C7Mi6N0q2Ix=*O<IwxQUAq*H6S<Q{J>6Jce4Xe9N-dFAqo5K)cpdsA;0)X>
zN#267-wPenW&*6zY@j<zIl3USs8UqsqCPEzR>9bA#hRq!jX09mMZX#j2ZX@KIw@y%
z^joyN-D!{Uny-|O?au3yA816^pds=;4yQx@44A|S$HsWlPQobK+7H|6b8G6v73W`T
z-bPxlwf)qDst+%&@i7VxDjUQ)9^?kn6DucW4e9GD1@Z$61j1JKUvsm@99io5l>+Mq
zh>)g~Q6!>&<Q{erIsD2Y$KsZUUQKw7XI#=iju3id^eIiwXpk`Ao)R~iqq!-w2PK$t
zEy@)_Wyh;2347J3DRX(RU@w#|T#~j?<*XG8ro{Odd+uAd{Pec>pUZG)lw1UYTg}C7
zF`EzsPjahbEJD+>X^m*bz@FO%0GySckQy&e--OL%gKiR7%Y+}=0IZAFI9(2BwtU<=
zl|d6sGA01=u0yQr4n=5{*4RgtZPfJL0Ih!D)F5K7Y0G<??V_!7cyv7Xu$?e_1sQH6
z>=I%Qn6=(GXRzs83dG-ZfDo?a{aQ~vzy!m)zG{IbN~R7@Ip=B7t>1*`VVd7UzOg@6
zH2Z!)!JbCO<cv~@S&B){#F^XHBY9QGH|LpY8<uFOA^RqI{~J*me1XG2xk8;B3rf#G
zl2h$LdOhj^(IPF~z0i4PFwwqqs8rQ`{Bcy9Qcp*61fyu8;zL6ej)(QV!3fkD1dAL=
z7k!YwrY&!@jhOrts98FQ7gYPT?Fq;O7aJ4fzarj)l*7YELmB~eJ{d`G`$>2zEE^>w
zsI!SvT9W-~&FtQMVYxdDQ`SP~T>~1%YL`5cIzn@!cWB&4M1n{eEq`un8rfnEWasLE
zh$0E~Yyjb~^Dwp{URe{=KyF(Cll&R=go20pilhMlbT|sXue6#8eGR{-BE{wv3R;k~
zhHB=-ltWtqDROeRvl}OyF-3Z3R1d{>x-A^=w`v^4mmjOG?E9-MQ$x=qQ45*OCNVhR
zOlJ?13o@LVE_L{9G;}{)Dm?W}Gi})!w<U5(?hVhn3e%oa>Qx$lKg8*TMaINM0B=+u
zF+0>9)vibC!Eg|#z@LNNB7oZdC%kQl4A#v2ra7Zl=F0lMUb0=dzpU%`${Bq3t%1b#
z;o?lZ;p_3*W8{cw<3vlI=D}z)<fC-ky$U=#x3=T6Fb=u4k2n>Qrq4V?0|g%P1#rm}
zqTqOW!YhNUW*s$m)annpx<N71i7lk;%0H?=lBnv={i>li>5>BeYUY)zkij`wC>Imq
zI(N8;B(3foF*t87K7cl_O8AB(cH`}wyvLc0w{v@iQm~;bG5LEIRacz#cfWjnpz&4E
zcAN_U+|ddmZN$AgMpea%o8Y5%BCJ~CHj{qtJAV4KVd+4f&;7k$g|d4Slvb1aH7J)Y
z+{Lh`RI^M1X5%~0%mwFvC|zZ#p~JuH{yq__j9L8fGxTfniS*}!(c$$^QFE<x@x-t)
zsbNGs>pWMg_k5M4GE}3=5lmWR>I1N=QO8{+qf4DX5pE`kD@7*ARCsviiy~h&A#g4!
z`V<g-S$P|iKOD2I7)t&t>P9vPM}ml$s;iE)^cUxDBzMNr4wJNANVu^<t)*j5dT`vJ
zelBhuiBM4}KXr+1)X)t|p{5n;mt0);eLih9t*fsn6vz`&p`RlZ+-q6qUvm!cXy-bm
zZEi~1UeqmjtZci4Yl|T%s{3#H_ZKdq3A{Z~OM67n=WZ46l;9cCR3PH=qmI#?$JuL=
zt946#7oNy8uDM>=)mx{;p1edVxHK<oOp2YBzXs?*AQV9=-yECepcC5eO~MhbK~ZEK
zEvDnmOA0pd=CLO#p_ceq03RE*VKdm^rriNXRO1s+kz#mP*%_AKXRD3uR=D$Z6Z2|S
z^jnLTAhkoVroSlcFLNv0_tfYXgsP)11jJUMQxH5f1)3-Wbe=C@h3*sH$tBg`j^JTi
zBYd|xJZOXX&_=2$O<U9Iuj?wj1E0B>I&@%X6ij`=&_@_;Nre03c?79W)s%toJr}G2
z`Uw0qxikCZT}dw?=XBg24L3S8g#t;sCCtN+r>QADnp1@}9$4LgnBjXvGPw2iUMWR{
zisa;83@yTuqIj9rixGI*1!;aAQcHviwTonAi}<=BU-cAR8^jCKhB_iRInOB(n9)yo
zUavaRU=oiFmETrLSAbSfybZD`+&8M5SN#=NO3Jr|)f>f04uV<mh>M_i?l9?DlG5Kd
z49biL=+5nh8!Ot~{N!r8%1OB^LF|Go9u%U@=!4boVG$@Yw@!x|o!>hrmH`z!HIx<A
zIAKiHI;vKnPW-M5rTNk)0Cx<;C_6#b_`V@J&ue4koH%uXvyk#)gAJd7qH1rI;188;
zv*kt>U(ew*G+hFOLrT!&ru%qUD?;b%_SYL4aK=sW2p!<NYKeW&zDAK$+i*!F)_p<H
zmNLW@;c!;#i#M<LaPhoh=uOgt+G5k=U@0C_;Fuzx*c{Rd=2j)4lS-IUW8&*@QU%Tm
zVELGM1<?{=>;G2#Y+^!*h*ODDPl<XiV8&qRn*W2&wk#MkIHKy|yT*1XRu6$~pEzuj
zbw}v27OL;LObSCja%P3ujI|*3d#0L%e9Epha4I#s;#LU0wlOJVE<tY!_Na{u-%2*%
z*1^UC3gGO7KJ*Z_d=RmtD27vRso<p|^VrOJL#JUam*t(LZ~Pe*V?iHg)Ou<$Y5POI
zEQ$sgrr^-e*ocM|o=XdgGM}Lho4#kv3;L-_G2atBhbGpNUnUI$*Mm~&jwA+P^1n?N
z-|F+8iI-fua96E~F{i3K;%)VksC(T;AtWG4u7^qp6>?=#B^vh8CPcE;aCAvA$j=LE
zuoFg=spiA>yGJ@`)$Mj@IMIU1+dlXD!6WcHhbwU;dbUG#pk_E>P75nMF+{#$poHX8
z)Qs5?+8O{p3|BLf&WEb0pp_N3*>=I9XPw0hwFw>?Vm1J5r+8D>ccxNeS8?Fag~YL*
z(2%W3%op3k5%b_AF)vgSsy_IH@`J5mz0QId0>iUJZ^){KD8b9G8dVZ#X8<!fkZZPv
zB*L$cgpfhDZ$Cll?aC48?>MXOFf&09Ltb9Rdv#?*Y0b0vBYxZ;ql9uT2ACFTEq$cy
zTI$1Zv>`1SJVQQr;fWcka*Es_lnRi4XLYna_YqbrY(+_2P$m-0L9?tNTsd7k#2gJo
z=}4SR%iY%0M36r;(ocA+ORLf>cZQD)xhuS7VU2(xd4siwRMM09-k@1J`bIPr>KyAc
zCSTld>r;$CWq_xsT<ebIRPTyW$%B4HMu-=#{T}C<w(QkCcGqRz2Sgmt=1DU(L4ogr
zb0n0p!-ZtHV@3>;NOfiLh5E#!G)Sw}Ti-W#4nbfIVVX0musGSYeLBjo80&aKwj^@?
zG4nPg=<r1InW{+y&NYCl5i9#4Rjfj=w5s5#tbc7{AOG1@b-%gn>!3DTP$(QcVt;Vt
zk6(jR@)kt<;z$+WJ@st`#c$(i81fhgC(+JjDt2|aCR?<qGPAhNJI@^pw5+Pz$;A3Q
z0?{EqyysKD=y>S&aeIX0)fDI?q>10au7^5%u^=c0M%m-iGE>3uCmb&#(S-xgPqd*=
z)I_~MpTD9($-QT$!=b)_!~y4nHA)XOWhFE`C+!RF-%+A0F-q7uOquJ~X9tWrjqkO4
zNzNOe{Rg0gx9GWtn(;B7!YKx5->Ww`C&Y^+A0iI1xaVA=TaO#rNPhgn)Q1xc05ZCF
zjneMiFrDsDy2+#Yn`&zjgv;^pplNG`@TrFb&XAZ$G&HZD%gT&p6sRvi6YsgcqH1TF
z>b6N)5P|pQ`&lN+hnk?=t$0#ue3^RO7LCG~QB?_)Ti--G<Tq`)kZ!*~u$(B3H_9mO
z^j(JP8d@|&vb`o)UI%K?N39xWpr-#kh;rVj(+}Tr^<h%l3iLQ!#1iXk5psVW;ly=n
z4~*5GS%E2wl=JwQw9qga;<p6cLX-JU+2icw45nM0m#O8~@X6B#ZF0{rTRgwN#&Z3b
z{XssEeOjT!Yb2tK1RFnY6(@n|Yx2N1)bZh>FiTz{IHKfw3S*~3v}y<}>m=4L@OtGi
zzR<gD=9TZb7bwTDF(J|_#DWNpxUA*PoD>6Pd9yQC6ADS_WDk6;;H73GaN)DcuIdQJ
z84gv6ZXX7fVpL2|(R`F)5mi`Hwk=py|KQlE2ZP}oxL`gLciNpErTW8tBGtxI{hD;Q
zBbu2k-V$buFGWRn$V1pHQMGJNKW7ob*csAC;pFT{qHlDNO=irQZf+T(sK82~9?mEc
ze`vkq#OuZsh(X{4>^Tl041j==KYHIicQNY5(gzr@->I7oFYZ~{5=y{9>RhRA=_E-a
zRbLGh;E#fdPMZent6b99Muf0I#vVzt_NCFd8~K}nbD&;Lo=S_eCOGCrcL%r_yT!NG
zi=Vt|fOyJFHTd&3jK{A6YgUSo9g$LLZR}MWD4GG5hV!C`T1`Wd=cUL&D{$@Bn7P?;
z1yo!sIT>NI71^!XQp|B5W+q%Ldt*-J2}0cRZy4w6sxCyQ>e?Y0Rml7$eI@vK&y+bj
zMxF)CT6(bVy=&Q@XXiA|FL>VtV{L73+Xd;Z;=)Nu@Tf!Oj0;w$+|fctUX48ai$t=6
zzsLvcj}|9oIjkwZ4)LD(;(&zK)ZZIAh_w;#GO@|ps>7`{S%{sw>z8f%qh6Zhw(*tw
z3`M17v9?6EfBEL9#;mCV$kcxSlI-vYL8akD7uj{*dPKHoAeV+Vp`(uX4%|Ttd9K#e
z%|^-CTg8Ws;*zmL?ROHiLP%H*7_{H&qZzMjBA$BSDv^JO)83@A#qxdbgfqES#sjB+
z^lHzdsf>+yLx&-<LL4x-)+(W9Rb@c?%KZ0<oIY*UpyCupu92GxNz555LwR<$qvo`j
zdCoCbS}4QN;oTZ+Ydm?IEBKon40C^(Yb}!+{c5?{y25n?kHwEAqdupNNcko-p%e6|
zHy{aDk$OC7^?pOH9zo5+*9-hV<IbqXZ-x@aR7+$6l0u1)B{hRDttp0M72qd??2s@S
z7r3Je9BY>mO3SrixbV)8WM-piKvX&by9Mg<9>#O`8e8<#eqF7%XN1Y@#y=c0CIQ1D
zUG&)RZNsul;Wo9l;+r<-NIY@K$jYr0`9JJ9sY*5H+N_K59Q5MIi}H!f81U^>)JCJE
zeEpK5<e@rnHq)=AE2T$CT%g4>5xTV#!LgBIuRQNfrCI7)et=Ux%IRa-7C#>0SKt;Y
zDKBEXIfIsKm|`x?@!kBf>cFo+M+!EZ0ZREp9WgU1MT&&9v8*_o*>`|)Qiu!AwQ4(L
zWF3ink)MA2G?RdQXed1|B%_$6Celc^Lwl=(D1V=bgmJs9+MJZK2N7jCLl2JvlS-RJ
z&<r6U^(Xxm&97*orr+gbIIgLvJAM;3EwOOBLbyoC*=PPZb@EZA(9-xkJYPD@W<UNf
z@7ua&^as6+IPJGga3(S!Yx;SDc{^glm)623ChNWR)04_~Z?xx;+B>e`b-1D}X-1^u
zKRr#UuI`AF-OTpo$@-m^B9dZ)sy&;pRG%-0e_z-<Ew87qB{4}yH}6)ifq$bv&~N8Y
zRCRZChYi2>%*60cOzdk<bD->zI9|FYqJ3{tT(W35k2RBdWMymCW)m2v9Hm##8yh+8
zl+@GbW!${AmrlZBT&+J<K;>XkMFG)LTPgE;ht%yoAnY(#52({mfRk_?nMwv#C5G`v
zy>4J%fzq$xK+o*YnH-IC&hX@!nHCC`v1$_a(x&B=%=tG#72E0SQD1=8hj?_?vp3@I
zg!d`i9{F<D4<&E7YIY5LS=6}zq`E+MaV61|DyAQ5qhTY&Os1P(BPIxJT2ij<*|oNV
zshu+(S)jHmqwtwdSRYFFIe6jyZ>x~tRvhWHQIN@n)!poIu4mi&=By>ODshW+qDh;I
zRoa|lW99||7u~psasU_M-?Kkiq&+R79UZD;z^aI3z)^mX+pRbdEs{9IR}qiKES4!X
z@W2Sm<LC{pz=^2L>u!UP|9EUa>4D`4Wp)>pD?((V{G`n#2#k1(CF2VuxP=Q&pXX9R
zFG>g(V9wq-8PS%KHC|n5i&CzqJ6Q;JZ0}3{*5gVD!{i#*qYiQEq4!--d%G1SvMYDF
zMp-FVsXPA(JSaV^V|3!N#6Czg?<wAhFd_BncLBwXHU^gy5V-e<EWlN^zGZ#*VSO@}
z#wu3Y{ZOTtUw)oR4@V6yXjFEGokuV1d#&~-RX)<b^b}pW@lSD0OZ&w3T7&zAn-p8L
zC0YL9>z*xc{nf%%meKO6G&Cu8-S;s3&-i%U64)zJAHrWn4J%+;p28d%8o~;RR)N@#
zY&wO3&;b=0ngWSo^IGI=osSank?|YkG`G9&7fDjJzcVbp>#^t1PQGKXXg!PDKxM>9
zEMwO~jX@4LsA{Q_PisUH6*0h?d#ylOX_sHb<G2J&s2XP7ev?ahKi-$rr#qX0`X%^7
zXy_5SK#IWcxPlB5?BnZL?P!H(#i}({>yqhfY#z^yV52YiP))<vaA*y1{?a%OG*|d@
zw$b9%%=((g$L-R^J~N>xK>%)RXRfkL{A9|A?&{w}zr$^U5Sks61y!iCeCaIoVGks{
zy|6`a?FS!-Y<&+c_QfpjmzYXjZ)?zj7lF7PGQHYzGZaP(nouHwYX&upEp?IlD(T%h
zah)%ioRZ%JPEV%Lj3*y9YRxE{g6U{OYCGhM1&kMdNMOB9%%#+|2AR~$?IoH$T2CP&
z?e1NzGmOh)oY<D&U}ZFsb*kp7M`ahs`}UD^)s|b%Wdx7JqmpfU`a|94n|<w}%1O{q
zc_Dh4@*eDx2#7ASXow>Gg;tc2ks2h#;|=1%rPiplJ=h(2#N9hNB&*cp+?Iuh4hb0w
zI^MjtHiNTCZN*Wq>&3rzIPy8fPA07OE=)<zn}5)T#ZXi4w3mF<l*iRzSy6Z>jv?YT
zpGU4)T;&M(h#=3OyC<saGW>A;gwrPPWGh){<-=YGm^{r!p=TX`{D2nX?)I95`AGj$
zp5r8_4rMuLS9<<l=FUka<GLB;B0W@R6P^c?R3Q{e)(L3k{DX8GWEiuF<Q@VRnai>z
zls`Zzsgh0Svk30eFNV^cZP!h+6JU(MTYHHBYo`6u=J&4EL{95RwHGy=zDGs|>Zi!&
zXk~LMnP>U}GT~V!;@H%Xag)E#edr;`2z7k6<q=Z8$c@9?9WZ@MGh9}6z}Y6PEq0?>
z0cTvhZ#9~|@J;zy4=qTsK10ZbCVCokGi4mn_$zi;He|S<G8$#1tbNq9^hb7B$0|6t
zFlyzUJJ*QLp&wi)LX!YcjrMk=C<>oiv$A?yLF6g(Nf$DHhpKPQoij_?SoMo0UmJSN
z7??M*v$EyH(~W|(L4NwVkBch!X`ox47R{on5H91vAo#uw`0{>{&lK0SMQG=Fk+=uK
zp=j+J`hoZzDb`4?m^{zp9Neo4VE9tT#oerd#;pJ4Ox)%3qSO%REV_JG)6{HK&Kj8n
z>_nm;_ln!+`k*SZoBNQ;atUc~&9T(>Fj{;5o4BQ`+z5Z=Rb?J^J2oF|{8<q)W41De
zY*Nt(#^uG*jTTcf11vxtnlx-5!WfmQR^Tg3f1vQ{xf!J((!lV}RF~^CF&2@tcmaW7
zE6pK9@i6#}6PwEE{^wnX4Km*%#KJ)hP}X7RE2d9^I$t$UZ0t)z7&6<)^2E~?%}>pl
zKfyHl^21#~@(1>t^MG_W8!<9)-1K^KYHnmO??QjHAcrg#r}=9>N0A=hyYuj*=Ql1Q
zt7{@FkOD{2BGKhjpev$o^cjV|eqoPAoQu<+VT$Ew<1&eeaAX13GvBa(rmRt0$OR?T
zis39PR&Ns>n5&DQo9X5+ZR)ggX5rKR5*|fXM1A)$#P2TqyD|x~Z*lUZ9vNRUrkFmY
zYMI>nS%tj+g1s8z^IB$_-4@3t3g_!*p1R;3gxhOO&>h~C((B5Ftul$rRhpl2dD+CI
zt#d~c*U!qC?-9JPGK;QNW+k1YWvHarwG}W3vY-dy9aNJS`D;Ts(W8LL6Ye(w_4m<(
zkEXF#SJM@m3u1~T76(a31+;S5*DQ_{z?AGKy@iV;qth+zWUO1{H=HiAk{&BNghP2m
zLr0mWcH*}J*EQgay9XsdGQcV?lH$)4cBD5Euix(KOr}r=+*L-tKhz*t!}Y)*`SSV{
zKEZ~lME>?mzcP0yU@N|?cXG3H(!tS4%5?22^VRNj>RJt^=Ny)_PnBW0`hf(IGyDWL
zKjwCbIJr%6Am@1FQCo=RlC6jKsv$v-bP#Q^Ej^>dosgOkcWf~*{MSZs4abLD>OIh}
z$<MC}<gh1x!%DKZTj>YtI067L;WkoIY6?<P|ET7Bso~2FND`6n7bh7s(Ja+q3e~|p
zNGuf8$Ha4)W5O+ztiUty0JUAc%I2nFWs48B>+MY#tO|>5u0yX2rMQFHJYFx^r=tDE
z&iEnfe7%+Y=c&l)8jNJ|ICr%j$<$R<mg2zR8&7T2PO2y*IMgB&%XAKU1qJW;dcV6n
z-`89EYkR*)x@^Ci1*_8JK_c~O*C_JVYKU@gqx)+Zst5K4%;}60?~;yU#+-6rp}!L5
zvM<xT8~~d&PW37xHWyW5sba}#E0_CIZZ(bi#5U{HH7<zUzmgINfMgwUQ_GuTDJ4=!
zN}$oEs>{UbyvKdT_&vez4odo2nl0ijEy$In0EpJKh4?${$Ev~o7i2z0T*P)0`$uy)
zq+{SjyF(E9vgak-nHa3D@3M&vfGfXbaoOMsX@41kt!_EH3GwYIKuR^zel&i&oN@cI
z=aDc#6Q7_JKGe?9sWu>26kv16<O54W0xX6fHNN%sQnhmWoo91>3oCHvnmBzjn)*_8
zNo4a<U8$%1M$p{JfemcoWCmgLc5r^Fy95A)#k`%t=5`Qw3Nwh6jiU(F&yLSj6gCzj
zRJuIMAZ2GMh_#KpuPa2;S4GR**UntPf=WyjMc7;L1;7E~4yN#Suy=G5^cJD|3s>;v
z`cE@E6~$jB?sg(nddg}PQckWA3T`%THV~_fw~Z$!l_&~@u&afopoX;U-yvS^M5wIY
z-JJ#5*}c5H*u1#doLsHgIRpd**g>4^oSdvL7OZYQj_zP@R!2ALKM;SzkcPOKyV^Lr
z+c-H={J{j9IeEB?P*J_~Q~YCm4$jKT|AcpR`#TFSe6V|io!L3qK<o|<?EmiJ<}Ty;
z0`m6({a-!Yv|fr-*)<?;P9Co25E)O1qdWD#Ls*#q)8E;{)&8$^EX>&<_7H~`Q@59>
z9RCqgPC;4ipB{fGu(EM*{>$ry?EkQIx3T;eS^qJ%KRth?^X~(BasMaoe^~z`_rHu^
ztdx}nrJc+@{tQn+T7>FPd_fB*a~li6zb?W2U_Jp}ZZ1{`57>;A+surQl^<lr$;tud
zF*gTufjGH&`2Gz_!O_hf>}U@81N8#VX7hq$4(1Wy;N!Jm<+tSJVdduJ;$j7xaqzQ3
zI3c_|oZMV|yyiUr2BGR|^P)<y{lAau50u3pC{9ZdCm6)R%5NdS&&tgO0kaBlnnPGQ
zcz7&1_{_L?`FO#9L0Om!$~w6^fM2H5#sO>vVRv@4`m5s);erxs3L;dTY@mO&sM&+v
zEngf&sNUE(dU*e<L(9eiqUjF)!zKqG7YM}9$-%|TA;2lX&G|1Q9f+&jixU4}a)8*l
z{)YQ!S_EH`c_9}3N2f0Ue|fy*A}Hkw0lPc7YB@RCi%|U;62%|SzvN9J{I^Mww{d&1
z@cE<oziVC-;_|n<zbyfKo4>j!DE^YIAlUqGLEONe5R1P8z4-mD%iJ35Xa#v$-+vd>
zKiX~nFOvn~;<Mni;Id#fH?uHj<p%SDSj|A(5LN+x4n7M$ZVqmKkokY2yE$39dx2dc
z5>_vnzGU+vpue)AVEBtl#{abTvWEQO=|wlJ93WOsek~4=ASb6F2QM>-Ul0VMV*h)>
z?0;7EKQb0(|Nn3z{FlMMZ38cUe`|Z$US4)9_J3|yf9LEEjsFinf1iv0hY?<&{}<%H
z;`e`a{g1Byih=*i_<!p9A6@?y1OJur|J3#W8(k>>df<ULzWfXFdU>4bJ8<U!08p$H
zq$RYh*X9lUoVDf&e+PJx>jQ};6T?kCaSHY=_@YOZdyo!oE4jXZA9YW!l95q*MQtF5
zP;MI#ywz-5D5%J4J1oaVRpHTK@IHOu0#lhcEfXyUd)$}`vya&>dG&bh@;bq^zsc+8
zX;(N};O`Rwzizj{Tfd+^%*g1cUj+eH!{0dLiva`U4J4#L;{sQwKmumr36m{CpF4gW
zri-_Q%H*Cb)Ga6vqF|kW$xBj6hv7<T@tv$S4UFnF$8OX7EPWTy@TH5Bl)S#)4i!qR
z%5@2RcTi8;w1SJ8I+wtpmq21LF&^u|N9kL_y524Hk$b7}v)ny>&+8*+tcLaPr0-5Y
zT23;($DKNyQa%VKOZjEA!$az(G2s=F_IMQn1Srwm;W^b_gw=#y-+zM{iiy*fU&k=m
z!sEJq4b#cOl@fxc9tb)z?dTiDwq*OV^2x<`9=<T9<lNf=hRZ(d0;{K!=|1N`AAYRI
zDXuOWL%x~&?yaS>l?IkcCQn0#$u9_c<|JpghL&}3EiV>~zdmdSz5OIlB^r(js-fw2
zmMKqK79+E%z-~j%Llde{WC%e+y<W(1@W-VH5Z)ZJoJ!PZRH}K@`p2J$R&q`Fa^vHI
zz5F$lWm0q+g;7~o)41Pka4!0#arxNv*XlVw4fE^Rj%SA%w8U!#^AWC%hX&cv$T|@(
zu=G9ZziY-;QYB86vl`>|a>FL?*zpK6lymTW%my>Vjao6y7F-CMX>k-_7pIXfd_MUm
zSh;oAuu-YAhIpC4`M@uYfdG5z$8(#r)`%zWVCnCy3sQTqHsdH7hx>-nGbk<%6#XRd
z-XotkPAD0>W^vMUx~>M!oTFzZT1CQa1<#(%=z2Agg`DA3%0z^~s+?nCfvUW^tT2Sz
z&QMhu`kKi>i3uyE>;Az<w>_xQUjP|UQL8O`Ej{Q4Y*mqp10&DOnD$)zClfvT+vA;#
zB7lD6!nse`3BonZFng`suc}diz)o!T%@SAX@m%++Y&97rKoo$(yHW|v2}&y3v_r)L
zXgp%Ozkre);vK7ULD-%L3cj82tdtkM!U8k%EiyjyjGxwkJ-*W5jjEz2nONZ0I3ue;
zun0NRD4+>N;XAVgH$3qwp`Xg<{1b<cRHZ0s+OXU=xM?)sDfJx;4L+$HD^5x3>oe$C
zn05?cpUd=$A6No|tHy5L#gmgDakxoD)&)r!Hb0gVP!b*6UIh)t6``hNc`XA=#nJ&3
zfuNh}HzDY@NG1oBr@~GpJ+Ays{F(*BqhrifRZ@7v_L?l9?&1fjI06HLHKDJq5*IIG
zRV$4~V<$q+4HPrXyaVFwy?=Sb-10dytCmjGDQz0B>1l%SS*;xV+@d#1uV#+z-NzH#
zds8!~GGWgT%n-{_Njgt`_`%$At*y+;ruIt|7!MorVKxy<DFA?H2y=BBCV`|XrRGD^
zwYlzCr4X_JZM<Q8reRJu=GlU~@|6yhx3Z?YKTb(=zHGcx{9W|Pj_W?5zU69QYPR{i
z96`3NsBQ6cV@#?cWx%uVC7FH}<D7gjVKZt)@5D3GyslA0JqW^zR{0|}63bI51TYxY
zxFoIf46drIB7CHSePZiLiK`Z|9Hg55T%PPawh(P3eYfI0*iVcol_2B$<;*Mu&0tHE
zTxiqw3XR&uFwFK*UcWMh#vWwpf{SSHfepZoXY-kuTBH)(XLIGTR`$4NsLph`K!&c<
zlC|~cZ)(=_S-Y{r!KO%J1Gu@>a%skRvcA_zcV2bfGGuF2eJQLa=(HwCfqvGSb8lB6
zLFa7~g_#~B%wB$-x~G?}b`3|YB$_rNh$xNd5s)o?3zwsq!Yk;cV~riW2jx?j>{grC
z&0trp>x;>)laco3Lz}WxAliAwiyK(2-|1(U1|;htMdi5t?ZLFc5OP?{BC;^^wu#l|
zUH*w##)ZVg7-NbN)|6DQ<*kST$BO2xK)&7+(fVZ;m|7CGz!LNKN9VZ5h{(u7%*tiI
z+Lwj0vz_W3AW~G>?(-ss(34SL%kIO0wsUywp*TWpMHBKZ@fKTbkfT_)OMyrH%}tj;
z664_cx**X=E2}w;(8XwB24QAB&+m~K;L|a^)C4qW{&u5ftbM{#{0%n#C!RJF?s`f~
zJ4LZ&ktU4{lzm2d;b`~;Z;PFUnoyBNFMg8`%s*lMJ<{!jqV<J$lB5!>cIx(4E^pJ(
zuCDAuzT|uWGqI)nR7=?*j?HSqEf}r}*qNHHn<EGlfXyO5GuQYtj3LHANo!gR+9Cvu
zC&ejMaLjfI1NL8e@5C=<J&8F?pWZgpwkr9^A|-Khxu)r<t2@d`guvxEjHH&SOb3ZL
z|9roN9awMdhP#T0!;W;Bi|uI0$qPP?)|Q(h-}uRyU`A(urQ^jir|8LvaCF)D@uQIs
z>3W;N<?9L0^-npM>Vcoy>=x~wq65O(KW@-8w6&#PeJ;-v5rp$pD|Hz6{vy;>EY6O9
zRCOMbHx+B@Q1IC>J3;Js<rMdnrUdXxPE~ndw%=65)!L=X@v$i9!nvRQ()j@kr@FIU
zLx+h=XKOS&p0O&1USnx5S;jnN$j=Yn)1M=Ft()>%&@USeC$?ruHn*7b^X6@{u=mGo
zgc_!ObcBS3?3|#FI68J_!a>&`L1ZRA1dXkM?U_9Hp_4Yts{*fke2sYOa#uOfd#)=9
zjQE*3;`w;x&d#>Jh|7txL@&>Lulb%JFrJ%JL<(HYiXJ`NUGCy1jn1<Aqd%jD8aJWD
z6sZP1Y;Et~zxY*jlQ%2o;FZQ1HGAd5vEI?8e}q6j&EnT!9?xTl*sRe8v@tibb^juw
zx2GdvvzcQ-hjMpTy{S12oA<4DCvo_m{4Ir<`QygD)hmwDaoedffVT2naxA+$YV!tN
zcVm<72e$TWW6k+4vY~g20yrgV)Iw)piBqO<@R6X<nJ$<6hh&YL0d*Zg3xpPyQE1R9
z0V+wkFn+904V+R-VD85$%ZkbkvX>&VGaTr7kH}Wa?nN&4MQ&F0W>AY9P7hFAeWQVv
za@t=`C8e7vBh4O;vSt|aY}n;}^`&3I);d*3#0~dHAhSxe8`abht07&uM=!$SG$8X=
zQvA}G2l(mfdw}=PFypJ6ETOXyN4(3rAJE$62PiqqbPf?+_M089G@GdCNx-&6-#1J6
zvNxX!3wlCV)TLOIzJ4e&U0J_fxz|Req>Y~p%{EerBU5H@TUOJup1ztJo`vQ-VkI0Y
z;5ihJ1UOQNH-0dMDR_%60@(FC@1iz~mCpFYOZ!8n^okBo^DQ&L_v8@)H=Nc$+@rV7
zP|kKxYtbJla@!TGFeitNe~Q$qdsN}&%T#}m37eM3{a_s)wTbFTS$0D40Sio@iIJpz
zn6!ysO~Ipzq>d!NLvaI0%<`#Hx4~}cHQQJgvtw~syq!WA;SzDDgmpvCoCyCiKrlGq
z0*rt;MMwc|uD-z3)cWvFKTXTAN!973e-@zbb0LJQ2V}r%DUMr(g7QM%no%M6M%}s5
meP>v*b~vM6)Xh5kMgEP=YCOTKS@X~9cLf<0={iZ%(EkGst+QnS

literal 0
HcmV?d00001

diff --git a/api/core/tools/provider/builtin/baidu_translate/_baidu_translate_tool_base.py b/api/core/tools/provider/builtin/baidu_translate/_baidu_translate_tool_base.py
new file mode 100644
index 0000000000..ce907c3c61
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/_baidu_translate_tool_base.py
@@ -0,0 +1,11 @@
+from hashlib import md5
+
+
+class BaiduTranslateToolBase:
+    """Mixin providing the request-signing helper shared by the Baidu translate tools."""
+
+    def _get_sign(self, appid, secret, salt, query):
+        """Return the hex MD5 digest of appid + query + salt + secret (UTF-8 encoded)."""
+        # The concatenation order matters: appid + q + salt + secret.
+        sign_source = appid + query + salt + secret
+        return md5(sign_source.encode("utf-8")).hexdigest()
diff --git a/api/core/tools/provider/builtin/baidu_translate/baidu_translate.py b/api/core/tools/provider/builtin/baidu_translate/baidu_translate.py
new file mode 100644
index 0000000000..cccd2f8c8f
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/baidu_translate.py
@@ -0,0 +1,17 @@
+from typing import Any
+
+from core.tools.errors import ToolProviderCredentialValidationError
+from core.tools.provider.builtin.baidu_translate.tools.translate import BaiduTranslateTool
+from core.tools.provider.builtin_tool_provider import BuiltinToolProviderController
+
+
+class BaiduTranslateProvider(BuiltinToolProviderController):
+    def _validate_credentials(self, credentials: dict[str, Any]) -> None:
+        """Validate credentials by running one sample translation; any failure becomes a validation error."""
+        # NOTE(review): the translate tool returns API errors as message text, so bad keys may pass - confirm.
+        sample_request = {"q": "这是一段测试文本", "from": "auto", "to": "en"}
+        try:
+            tool = BaiduTranslateTool().fork_tool_runtime(runtime={"credentials": credentials})
+            tool.invoke(user_id="", tool_parameters=sample_request)
+        except Exception as e:
+            raise ToolProviderCredentialValidationError(str(e)) from e
diff --git a/api/core/tools/provider/builtin/baidu_translate/baidu_translate.yaml b/api/core/tools/provider/builtin/baidu_translate/baidu_translate.yaml
new file mode 100644
index 0000000000..06dadeeefc
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/baidu_translate.yaml
@@ -0,0 +1,39 @@
+identity:
+  author: Xiao Ley
+  name: baidu_translate
+  label:
+    en_US: Baidu Translate
+    zh_Hans: 百度翻译
+  description:
+    en_US: Translate text using Baidu
+    zh_Hans: 使用百度进行翻译
+  icon: icon.png
+  tags:
+    - utilities
+credentials_for_provider:
+  appid:
+    type: secret-input
+    required: true
+    label:
+      en_US: Baidu translate appid
+      zh_Hans: Baidu translate appid
+    placeholder:
+      en_US: Please input your Baidu translate appid
+      zh_Hans: 请输入你的百度翻译 appid
+    help:
+      en_US: Get your Baidu translate appid from Baidu translate
+      zh_Hans: 从百度翻译开放平台获取你的 appid
+    url: https://api.fanyi.baidu.com
+  secret:
+    type: secret-input
+    required: true
+    label:
+      en_US: Baidu translate secret
+      zh_Hans: Baidu translate secret
+    placeholder:
+      en_US: Please input your Baidu translate secret
+      zh_Hans: 请输入你的百度翻译 secret
+    help:
+      en_US: Get your Baidu translate secret from Baidu translate
+      zh_Hans: 从百度翻译开放平台获取你的 secret
+    url: https://api.fanyi.baidu.com
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.py b/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.py
new file mode 100644
index 0000000000..bce259f31d
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.py
@@ -0,0 +1,78 @@
+import random
+from hashlib import md5
+from typing import Any, Union
+
+import requests
+
+from core.tools.entities.tool_entities import ToolInvokeMessage
+from core.tools.provider.builtin.baidu_translate._baidu_translate_tool_base import BaiduTranslateToolBase
+from core.tools.tool.builtin_tool import BuiltinTool
+
+
+class BaiduFieldTranslateTool(BuiltinTool, BaiduTranslateToolBase):
+    def _invoke(
+        self,
+        user_id: str,
+        tool_parameters: dict[str, Any],
+    ) -> Union[ToolInvokeMessage, list[ToolInvokeMessage]]:
+        """
+        Translate `q` for `domain` via Baidu's field translate API; API errors come back as "<code>: <msg>" text.
+        Raises ValueError when a credential/parameter is missing or the request/response handling fails."""
+        BAIDU_FIELD_TRANSLATE_URL = "https://fanyi-api.baidu.com/api/trans/vip/fieldtranslate"
+
+        appid = self.runtime.credentials.get("appid", "")
+        if not appid:
+            raise ValueError("invalid baidu translate appid")
+
+        secret = self.runtime.credentials.get("secret", "")
+        if not secret:
+            raise ValueError("invalid baidu translate secret")
+
+        q = tool_parameters.get("q", "")
+        if not q:
+            raise ValueError("Please input text to translate")
+
+        from_ = tool_parameters.get("from", "")
+        if not from_:
+            raise ValueError("Please select source language")
+
+        to = tool_parameters.get("to", "")
+        if not to:
+            raise ValueError("Please select destination language")
+
+        domain = tool_parameters.get("domain", "")
+        if not domain:
+            raise ValueError("Please select domain")
+
+        salt = str(random.randint(32768, 16777215))
+        sign = self._get_sign(appid, secret, salt, q, domain)
+
+        headers = {"Content-Type": "application/x-www-form-urlencoded"}
+        params = {
+            "q": q,
+            "from": from_,
+            "to": to,
+            "appid": appid,
+            "salt": salt,
+            "domain": domain,
+            "sign": sign,
+            "needIntervene": 1,
+        }
+        try:
+            response = requests.post(BAIDU_FIELD_TRANSLATE_URL, headers=headers, data=params)
+            result = response.json()
+            # The API may return several trans_result entries (one per paragraph of `q`); keep all of them.
+            if "trans_result" in result:
+                result_text = "\n".join(item["dst"] for item in result["trans_result"])
+            else:
+                result_text = f'{result["error_code"]}: {result["error_msg"]}'
+
+            return self.create_text_message(str(result_text))
+        except requests.RequestException as e:
+            raise ValueError(f"Translation service error: {e}") from e
+        except Exception as e:
+            raise ValueError("Translation service error, please check the network") from e
+
+    def _get_sign(self, appid, secret, salt, query, domain):
+        """Return the hex MD5 of appid + query + salt + domain + secret (field API variant of the signature)."""
+        return md5((appid + query + salt + domain + secret).encode("utf-8")).hexdigest()
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.yaml b/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.yaml
new file mode 100644
index 0000000000..de51fddbae
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/fieldtranslate.yaml
@@ -0,0 +1,123 @@
+identity:
+  name: field_translate
+  author: Xiao Ley
+  label:
+    en_US: Field translate
+    zh_Hans: 百度领域翻译
+description:
+  human:
+    en_US: A tool for Baidu Field translate (Currently, the fields of "novel" and "wiki" only support Chinese to English translation. If the language direction is set to English to Chinese, the default output will be a universal translation result).
+    zh_Hans: 百度领域翻译，提供多种领域的文本翻译（目前“网络文学领域”和“人文社科领域”仅支持中到英，如设置语言方向为英到中，则默认输出通用翻译结果）
+  llm: A tool for Baidu Field translate
+parameters:
+  - name: q
+    type: string
+    required: true
+    label:
+      en_US: Text content
+      zh_Hans: 文本内容
+    human_description:
+      en_US: Text content to be translated
+      zh_Hans: 需要翻译的文本内容
+    llm_description: Text content to be translated
+    form: llm
+  - name: from
+    type: select
+    required: true
+    label:
+      en_US: source language
+      zh_Hans: 源语言
+    human_description:
+      en_US: The source language of the input text
+      zh_Hans: 输入的文本的源语言
+    default: auto
+    form: form
+    options:
+      - value: auto
+        label:
+          en_US: auto
+          zh_Hans: 自动检测
+      - value: zh
+        label:
+          en_US: Chinese
+          zh_Hans: 中文
+      - value: en
+        label:
+          en_US: English
+          zh_Hans: 英语
+  - name: to
+    type: select
+    required: true
+    label:
+      en_US: destination language
+      zh_Hans: 目标语言
+    human_description:
+      en_US: The destination language of the input text
+      zh_Hans: 输入文本的目标语言
+    default: en
+    form: form
+    options:
+      - value: zh
+        label:
+          en_US: Chinese
+          zh_Hans: 中文
+      - value: en
+        label:
+          en_US: English
+          zh_Hans: 英语
+  - name: domain
+    type: select
+    required: true
+    label:
+      en_US: domain
+      zh_Hans: 领域
+    human_description:
+      en_US: The domain of the input text
+      zh_Hans: 输入文本的领域
+    default: novel
+    form: form
+    options:
+      - value: it
+        label:
+          en_US: it
+          zh_Hans: 信息技术领域
+      - value: finance
+        label:
+          en_US: finance
+          zh_Hans: 金融财经领域
+      - value: machinery
+        label:
+          en_US: machinery
+          zh_Hans: 机械制造领域
+      - value: senimed
+        label:
+          en_US: senimed
+          zh_Hans: 生物医药领域
+      - value: novel
+        label:
+          en_US: novel (only support Chinese to English translation)
+          zh_Hans: 网络文学领域（仅支持中到英）
+      - value: academic
+        label:
+          en_US: academic
+          zh_Hans: 学术论文领域
+      - value: aerospace
+        label:
+          en_US: aerospace
+          zh_Hans: 航空航天领域
+      - value: wiki
+        label:
+          en_US: wiki (only support Chinese to English translation)
+          zh_Hans: 人文社科领域（仅支持中到英）
+      - value: news
+        label:
+          en_US: news
+          zh_Hans: 新闻资讯领域
+      - value: law
+        label:
+          en_US: law
+          zh_Hans: 法律法规领域
+      - value: contract
+        label:
+          en_US: contract
+          zh_Hans: 合同领域
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/language.py b/api/core/tools/provider/builtin/baidu_translate/tools/language.py
new file mode 100644
index 0000000000..3bbaee88b3
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/language.py
@@ -0,0 +1,95 @@
+import random
+from typing import Any, Union
+
+import requests
+
+from core.tools.entities.tool_entities import ToolInvokeMessage
+from core.tools.provider.builtin.baidu_translate._baidu_translate_tool_base import BaiduTranslateToolBase
+from core.tools.tool.builtin_tool import BuiltinTool
+
+
+class BaiduLanguageTool(BuiltinTool, BaiduTranslateToolBase):
+    def _invoke(
+        self,
+        user_id: str,
+        tool_parameters: dict[str, Any],
+    ) -> Union[ToolInvokeMessage, list[ToolInvokeMessage]]:
+        """
+        Detect the language of `q` via Baidu's language API and return its name (see mapping_result) as text.
+        API errors come back as "<error_code>: <error_msg>"; missing inputs or request failures raise ValueError."""
+        BAIDU_LANGUAGE_URL = "https://fanyi-api.baidu.com/api/trans/vip/language"
+
+        appid = self.runtime.credentials.get("appid", "")
+        if not appid:
+            raise ValueError("invalid baidu translate appid")
+
+        secret = self.runtime.credentials.get("secret", "")
+        if not secret:
+            raise ValueError("invalid baidu translate secret")
+
+        q = tool_parameters.get("q", "")
+        if not q:
+            raise ValueError("Please input text to translate")
+
+        description_language = tool_parameters.get("description_language", "English")
+
+        salt = str(random.randint(32768, 16777215))
+        sign = self._get_sign(appid, secret, salt, q)
+
+        headers = {"Content-Type": "application/x-www-form-urlencoded"}
+        params = {
+            "q": q,
+            "appid": appid,
+            "salt": salt,
+            "sign": sign,
+        }
+
+        try:
+            response = requests.post(BAIDU_LANGUAGE_URL, params=params, headers=headers)
+            result = response.json()
+            if "error_code" not in result:
+                raise ValueError("Translation service error, please check the network")
+
+            # error_code 0 is treated as success; any other value is reported back as "<code>: <msg>" text.
+            if result["error_code"] != 0:
+                result_text = f'{result["error_code"]}: {result["error_msg"]}'
+            else:
+                result_text = result["data"]["src"]
+                result_text = self.mapping_result(description_language, result_text)
+
+            return self.create_text_message(result_text)
+        except requests.RequestException as e:
+            raise ValueError(f"Translation service error: {e}") from e
+        except Exception as e:
+            raise ValueError("Translation service error, please check the network") from e
+
+    def mapping_result(self, description_language: str, result: str) -> str:
+        """
+        Map a Baidu language code (e.g. "zh") to its name in `description_language`; unknown values pass through.
+        """
+        mapping = {
+            "English": {
+                "zh": "Chinese",
+                "en": "English",
+                "jp": "Japanese",
+                "kor": "Korean",
+                "th": "Thai",
+                "vie": "Vietnamese",
+                "ru": "Russian",
+            },
+            "Chinese": {
+                "zh": "中文",
+                "en": "英文",
+                "jp": "日文",
+                "kor": "韩文",
+                "th": "泰语",
+                "vie": "越南语",
+                "ru": "俄语",
+            },
+        }
+
+        language_mapping = mapping.get(description_language)
+        if not language_mapping:
+            return result
+
+        return language_mapping.get(result, result)
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/language.yaml b/api/core/tools/provider/builtin/baidu_translate/tools/language.yaml
new file mode 100644
index 0000000000..60cca2e288
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/language.yaml
@@ -0,0 +1,43 @@
+identity:
+  name: language
+  author: Xiao Ley
+  label:
+    en_US: Baidu Language
+    zh_Hans: 百度语种识别
+description:
+  human:
+    en_US: A tool for Baidu language detection; supports Chinese, English, Japanese, Korean, Thai, Vietnamese and Russian
+    zh_Hans: 使用百度进行语种识别，支持的语种：中文、英语、日语、韩语、泰语、越南语和俄语
+  llm: A tool for Baidu Language
+parameters:
+  - name: q
+    type: string
+    required: true
+    label:
+      en_US: Text content
+      zh_Hans: 文本内容
+    human_description:
+      en_US: Text content to be recognized
+      zh_Hans: 需要识别语言的文本内容
+    llm_description: Text content to be recognized
+    form: llm
+  - name: description_language
+    type: select
+    required: true
+    label:
+      en_US: Description language
+      zh_Hans: 描述语言
+    human_description:
+      en_US: The language used to describe the detection result
+      zh_Hans: 描述识别结果所用的语言
+    default: Chinese
+    form: form
+    options:
+      - value: Chinese
+        label:
+          en_US: Chinese
+          zh_Hans: 中文
+      - value: English
+        label:
+          en_US: English
+          zh_Hans: 英语
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/translate.py b/api/core/tools/provider/builtin/baidu_translate/tools/translate.py
new file mode 100644
index 0000000000..7cd816a3bc
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/translate.py
@@ -0,0 +1,67 @@
+import random
+from typing import Any, Union
+
+import requests
+
+from core.tools.entities.tool_entities import ToolInvokeMessage
+from core.tools.provider.builtin.baidu_translate._baidu_translate_tool_base import BaiduTranslateToolBase
+from core.tools.tool.builtin_tool import BuiltinTool
+
+
+class BaiduTranslateTool(BuiltinTool, BaiduTranslateToolBase):
+    def _invoke(
+        self,
+        user_id: str,
+        tool_parameters: dict[str, Any],
+    ) -> Union[ToolInvokeMessage, list[ToolInvokeMessage]]:
+        """
+        Translate `q` from `from` to `to` via Baidu's translate API; API errors come back as "<code>: <msg>" text.
+        Raises ValueError when a credential/parameter is missing or the request/response handling fails."""
+        BAIDU_TRANSLATE_URL = "https://fanyi-api.baidu.com/api/trans/vip/translate"
+
+        appid = self.runtime.credentials.get("appid", "")
+        if not appid:
+            raise ValueError("invalid baidu translate appid")
+
+        secret = self.runtime.credentials.get("secret", "")
+        if not secret:
+            raise ValueError("invalid baidu translate secret")
+
+        q = tool_parameters.get("q", "")
+        if not q:
+            raise ValueError("Please input text to translate")
+
+        from_ = tool_parameters.get("from", "")
+        if not from_:
+            raise ValueError("Please select source language")
+
+        to = tool_parameters.get("to", "")
+        if not to:
+            raise ValueError("Please select destination language")
+
+        salt = str(random.randint(32768, 16777215))
+        sign = self._get_sign(appid, secret, salt, q)
+
+        headers = {"Content-Type": "application/x-www-form-urlencoded"}
+        params = {
+            "q": q,
+            "from": from_,
+            "to": to,
+            "appid": appid,
+            "salt": salt,
+            "sign": sign,
+        }
+        try:
+            response = requests.post(BAIDU_TRANSLATE_URL, params=params, headers=headers)
+            result = response.json()
+            # The API may return several trans_result entries (one per paragraph of `q`); keep all of them.
+            if "trans_result" in result:
+                result_text = "\n".join(item["dst"] for item in result["trans_result"])
+            else:
+                result_text = f'{result["error_code"]}: {result["error_msg"]}'
+
+            return self.create_text_message(str(result_text))
+        except requests.RequestException as e:
+            raise ValueError(f"Translation service error: {e}") from e
+        except Exception as e:
+            raise ValueError("Translation service error, please check the network") from e
diff --git a/api/core/tools/provider/builtin/baidu_translate/tools/translate.yaml b/api/core/tools/provider/builtin/baidu_translate/tools/translate.yaml
new file mode 100644
index 0000000000..c8ff32cb6b
--- /dev/null
+++ b/api/core/tools/provider/builtin/baidu_translate/tools/translate.yaml
@@ -0,0 +1,275 @@
+identity:
+  name: translate
+  author: Xiao Ley
+  label:
+    en_US: Translate
+    zh_Hans: 百度翻译
+description:
+  human:
+    en_US: A tool for Baidu Translate
+    zh_Hans: 百度翻译
+  llm: A tool for Baidu Translate
+parameters:
+  - name: q
+    type: string
+    required: true
+    label:
+      en_US: Text content
+      zh_Hans: 文本内容
+    human_description:
+      en_US: Text content to be translated
+      zh_Hans: 需要翻译的文本内容
+    llm_description: Text content to be translated
+    form: llm
+  - name: from
+    type: select
+    required: true
+    label:
+      en_US: source language
+      zh_Hans: 源语言
+    human_description:
+      en_US: The source language of the input text
+      zh_Hans: 输入的文本的源语言
+    default: auto
+    form: form
+    options:
+      - value: auto
+        label:
+          en_US: auto
+          zh_Hans: 自动检测
+      - value: zh
+        label:
+          en_US: Chinese
+          zh_Hans: 中文
+      - value: en
+        label:
+          en_US: English
+          zh_Hans: 英语
+      - value: cht
+        label:
+          en_US: Traditional Chinese
+          zh_Hans: 繁体中文
+      - value: yue
+        label:
+          en_US: Cantonese
+          zh_Hans: 粤语
+      - value: wyw
+        label:
+          en_US: Classical Chinese
+          zh_Hans: 文言文
+      - value: jp
+        label:
+          en_US: Japanese
+          zh_Hans: 日语
+      - value: kor
+        label:
+          en_US: Korean
+          zh_Hans: 韩语
+      - value: fra
+        label:
+          en_US: French
+          zh_Hans: 法语
+      - value: spa
+        label:
+          en_US: Spanish
+          zh_Hans: 西班牙语
+      - value: th
+        label:
+          en_US: Thai
+          zh_Hans: 泰语
+      - value: ara
+        label:
+          en_US: Arabic
+          zh_Hans: 阿拉伯语
+      - value: ru
+        label:
+          en_US: Russian
+          zh_Hans: 俄语
+      - value: pt
+        label:
+          en_US: Portuguese
+          zh_Hans: 葡萄牙语
+      - value: de
+        label:
+          en_US: German
+          zh_Hans: 德语
+      - value: it
+        label:
+          en_US: Italian
+          zh_Hans: 意大利语
+      - value: el
+        label:
+          en_US: Greek
+          zh_Hans: 希腊语
+      - value: nl
+        label:
+          en_US: Dutch
+          zh_Hans: 荷兰语
+      - value: pl
+        label:
+          en_US: Polish
+          zh_Hans: 波兰语
+      - value: bul
+        label:
+          en_US: Bulgarian
+          zh_Hans: 保加利亚语
+      - value: est
+        label:
+          en_US: Estonian
+          zh_Hans: 爱沙尼亚语
+      - value: dan
+        label:
+          en_US: Danish
+          zh_Hans: 丹麦语
+      - value: fin
+        label:
+          en_US: Finnish
+          zh_Hans: 芬兰语
+      - value: cs
+        label:
+          en_US: Czech
+          zh_Hans: 捷克语
+      - value: rom
+        label:
+          en_US: Romanian
+          zh_Hans: 罗马尼亚语
+      - value: slo
+        label:
+          en_US: Slovenian
+          zh_Hans: 斯洛文尼亚语
+      - value: swe
+        label:
+          en_US: Swedish
+          zh_Hans: 瑞典语
+      - value: hu
+        label:
+          en_US: Hungarian
+          zh_Hans: 匈牙利语
+      - value: vie
+        label:
+          en_US: Vietnamese
+          zh_Hans: 越南语
+  - name: to
+    type: select
+    required: true
+    label:
+      en_US: destination language
+      zh_Hans: 目标语言
+    human_description:
+      en_US: The destination language of the input text
+      zh_Hans: 输入文本的目标语言
+    default: en
+    form: form
+    options:
+      - value: zh
+        label:
+          en_US: Chinese
+          zh_Hans: 中文
+      - value: en
+        label:
+          en_US: English
+          zh_Hans: 英语
+      - value: cht
+        label:
+          en_US: Traditional Chinese
+          zh_Hans: 繁体中文
+      - value: yue
+        label:
+          en_US: Cantonese
+          zh_Hans: 粤语
+      - value: wyw
+        label:
+          en_US: Classical Chinese
+          zh_Hans: 文言文
+      - value: jp
+        label:
+          en_US: Japanese
+          zh_Hans: 日语
+      - value: kor
+        label:
+          en_US: Korean
+          zh_Hans: 韩语
+      - value: fra
+        label:
+          en_US: French
+          zh_Hans: 法语
+      - value: spa
+        label:
+          en_US: Spanish
+          zh_Hans: 西班牙语
+      - value: th
+        label:
+          en_US: Thai
+          zh_Hans: 泰语
+      - value: ara
+        label:
+          en_US: Arabic
+          zh_Hans: 阿拉伯语
+      - value: ru
+        label:
+          en_US: Russian
+          zh_Hans: 俄语
+      - value: pt
+        label:
+          en_US: Portuguese
+          zh_Hans: 葡萄牙语
+      - value: de
+        label:
+          en_US: German
+          zh_Hans: 德语
+      - value: it
+        label:
+          en_US: Italian
+          zh_Hans: 意大利语
+      - value: el
+        label:
+          en_US: Greek
+          zh_Hans: 希腊语
+      - value: nl
+        label:
+          en_US: Dutch
+          zh_Hans: 荷兰语
+      - value: pl
+        label:
+          en_US: Polish
+          zh_Hans: 波兰语
+      - value: bul
+        label:
+          en_US: Bulgarian
+          zh_Hans: 保加利亚语
+      - value: est
+        label:
+          en_US: Estonian
+          zh_Hans: 爱沙尼亚语
+      - value: dan
+        label:
+          en_US: Danish
+          zh_Hans: 丹麦语
+      - value: fin
+        label:
+          en_US: Finnish
+          zh_Hans: 芬兰语
+      - value: cs
+        label:
+          en_US: Czech
+          zh_Hans: 捷克语
+      - value: rom
+        label:
+          en_US: Romanian
+          zh_Hans: 罗马尼亚语
+      - value: slo
+        label:
+          en_US: Slovenian
+          zh_Hans: 斯洛文尼亚语
+      - value: swe
+        label:
+          en_US: Swedish
+          zh_Hans: 瑞典语
+      - value: hu
+        label:
+          en_US: Hungarian
+          zh_Hans: 匈牙利语
+      - value: vie
+        label:
+          en_US: Vietnamese
+          zh_Hans: 越南语

From 4da0b706948a7623403ddc71804d1884644659c4 Mon Sep 17 00:00:00 2001
From: -LAN- <laipz8200@outlook.com>
Date: Mon, 28 Oct 2024 17:51:01 +0800
Subject: [PATCH 05/29] feat(http-request-executor): enhance file handling in
 HTTP requests (#9944)

---
 api/core/workflow/nodes/http_request/executor.py          | 8 ++++++--
 .../core/workflow/nodes/test_http_request_node.py         | 2 +-
 2 files changed, 7 insertions(+), 3 deletions(-)

diff --git a/api/core/workflow/nodes/http_request/executor.py b/api/core/workflow/nodes/http_request/executor.py
index 0270d7e0fd..6872478299 100644
--- a/api/core/workflow/nodes/http_request/executor.py
+++ b/api/core/workflow/nodes/http_request/executor.py
@@ -33,7 +33,7 @@ class Executor:
     params: Mapping[str, str] | None
     content: str | bytes | None
     data: Mapping[str, Any] | None
-    files: Mapping[str, bytes] | None
+    files: Mapping[str, tuple[str | None, bytes, str]] | None
     json: Any
     headers: dict[str, str]
     auth: HttpRequestNodeAuthorization
@@ -141,7 +141,11 @@ class Executor:
                     files = {k: self.variable_pool.get_file(selector) for k, selector in file_selectors.items()}
                     files = {k: v for k, v in files.items() if v is not None}
                     files = {k: variable.value for k, variable in files.items()}
-                    files = {k: file_manager.download(v) for k, v in files.items() if v.related_id is not None}
+                    files = {
+                        k: (v.filename, file_manager.download(v), v.mime_type or "application/octet-stream")
+                        for k, v in files.items()
+                        if v.related_id is not None
+                    }
 
                     self.data = form_data
                     self.files = files
diff --git a/api/tests/unit_tests/core/workflow/nodes/test_http_request_node.py b/api/tests/unit_tests/core/workflow/nodes/test_http_request_node.py
index 2a5fda48b1..720037d05f 100644
--- a/api/tests/unit_tests/core/workflow/nodes/test_http_request_node.py
+++ b/api/tests/unit_tests/core/workflow/nodes/test_http_request_node.py
@@ -192,7 +192,7 @@ def test_http_request_node_form_with_file(monkeypatch):
 
     def attr_checker(*args, **kwargs):
         assert kwargs["data"] == {"name": "test"}
-        assert kwargs["files"] == {"file": b"test"}
+        assert kwargs["files"] == {"file": (None, b"test", "application/octet-stream")}
         return httpx.Response(200, content=b"")
 
     monkeypatch.setattr(

From 81d4d8cea1d6c37eb4f2d4cf142ad12a667efc91 Mon Sep 17 00:00:00 2001
From: Joel <iamjoel007@gmail.com>
Date: Mon, 28 Oct 2024 18:01:33 +0800
Subject: [PATCH 06/29] fix: separator change add too many backslash (#9949)

---
 web/app/components/datasets/create/step-two/escape.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/web/app/components/datasets/create/step-two/escape.ts b/web/app/components/datasets/create/step-two/escape.ts
index 098f43bc7f..2e1c3a9d73 100644
--- a/web/app/components/datasets/create/step-two/escape.ts
+++ b/web/app/components/datasets/create/step-two/escape.ts
@@ -3,7 +3,7 @@ function escape(input: string): string {
     return ''
 
   const res = input
-    .replaceAll('\\', '\\\\')
+    // .replaceAll('\\', '\\\\') // This would add too many backslashes
     .replaceAll('\0', '\\0')
     .replaceAll('\b', '\\b')
     .replaceAll('\f', '\\f')

From adcd83f6a808e2d3a90a4844aca14441a8a9a49e Mon Sep 17 00:00:00 2001
From: AllenWriter <allen@dify.ai>
Date: Mon, 28 Oct 2024 18:34:23 +0800
Subject: [PATCH 07/29] Docs: fix docs url (#9954)

---
 .../workflow/nodes/_base/hooks/use-node-help-link.ts      | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/web/app/components/workflow/nodes/_base/hooks/use-node-help-link.ts b/web/app/components/workflow/nodes/_base/hooks/use-node-help-link.ts
index b5fe9554da..2ecdf101d2 100644
--- a/web/app/components/workflow/nodes/_base/hooks/use-node-help-link.ts
+++ b/web/app/components/workflow/nodes/_base/hooks/use-node-help-link.ts
@@ -23,8 +23,8 @@ export const useNodeHelpLink = (nodeType: BlockEnum) => {
         [BlockEnum.Code]: 'code',
         [BlockEnum.TemplateTransform]: 'template',
         [BlockEnum.VariableAssigner]: 'variable-assigner',
-        [BlockEnum.VariableAggregator]: 'variable-assigner',
-        [BlockEnum.Assigner]: 'variable-assignment',
+        [BlockEnum.VariableAggregator]: 'variable-aggregator',
+        [BlockEnum.Assigner]: 'variable-assigner',
         [BlockEnum.Iteration]: 'iteration',
         [BlockEnum.IterationStart]: 'iteration',
         [BlockEnum.ParameterExtractor]: 'parameter-extractor',
@@ -46,8 +46,8 @@ export const useNodeHelpLink = (nodeType: BlockEnum) => {
       [BlockEnum.Code]: 'code',
       [BlockEnum.TemplateTransform]: 'template',
       [BlockEnum.VariableAssigner]: 'variable-assigner',
-      [BlockEnum.VariableAggregator]: 'variable-assigner',
-      [BlockEnum.Assigner]: 'variable-assignment',
+      [BlockEnum.VariableAggregator]: 'variable-aggregator',
+      [BlockEnum.Assigner]: 'variable-assigner',
       [BlockEnum.Iteration]: 'iteration',
       [BlockEnum.IterationStart]: 'iteration',
       [BlockEnum.ParameterExtractor]: 'parameter-extractor',

From badf9baf9bbe87a56c4343cfbbbf70fab0d567db Mon Sep 17 00:00:00 2001
From: Jyong <76649700+JohnJyong@users.noreply.github.com>
Date: Mon, 28 Oct 2024 18:37:35 +0800
Subject: [PATCH 08/29] Fix/external api update (#9955)

---
 api/services/external_knowledge_service.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/api/services/external_knowledge_service.py b/api/services/external_knowledge_service.py
index 4efdf8d7db..094772d674 100644
--- a/api/services/external_knowledge_service.py
+++ b/api/services/external_knowledge_service.py
@@ -6,6 +6,8 @@ from typing import Any, Optional, Union
 import httpx
 import validators
 
+from constants import HIDDEN_VALUE
+
 # from tasks.external_document_indexing_task import external_document_indexing_task
 from core.helper import ssrf_proxy
 from extensions.ext_database import db
@@ -92,6 +94,8 @@ class ExternalDatasetService:
         ).first()
         if external_knowledge_api is None:
             raise ValueError("api template not found")
+        if args.get("settings") and args.get("settings").get("api_key") == HIDDEN_VALUE:
+            args.get("settings")["api_key"] = external_knowledge_api.settings_dict.get("api_key")
 
         external_knowledge_api.name = args.get("name")
         external_knowledge_api.description = args.get("description", "")

From de57af46c03d65f1f0c951e8f530516ea450656d Mon Sep 17 00:00:00 2001
From: -LAN- <laipz8200@outlook.com>
Date: Mon, 28 Oct 2024 18:47:45 +0800
Subject: [PATCH 09/29] chore: update version to 0.10.2 in packaging and docker
 configurations (#9924)

---
 api/configs/packaging/__init__.py | 2 +-
 docker-legacy/docker-compose.yaml | 6 +++---
 docker/docker-compose.yaml        | 6 +++---
 web/package.json                  | 2 +-
 4 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/api/configs/packaging/__init__.py b/api/configs/packaging/__init__.py
index 389a64f53e..3dc87e3058 100644
--- a/api/configs/packaging/__init__.py
+++ b/api/configs/packaging/__init__.py
@@ -9,7 +9,7 @@ class PackagingInfo(BaseSettings):
 
     CURRENT_VERSION: str = Field(
         description="Dify version",
-        default="0.10.1",
+        default="0.10.2",
     )
 
     COMMIT_SHA: str = Field(
diff --git a/docker-legacy/docker-compose.yaml b/docker-legacy/docker-compose.yaml
index 17b788ff81..e3f1c3b761 100644
--- a/docker-legacy/docker-compose.yaml
+++ b/docker-legacy/docker-compose.yaml
@@ -2,7 +2,7 @@ version: '3'
 services:
   # API service
   api:
-    image: langgenius/dify-api:0.10.1
+    image: langgenius/dify-api:0.10.2
     restart: always
     environment:
       # Startup mode, 'api' starts the API server.
@@ -227,7 +227,7 @@ services:
   # worker service
   # The Celery worker for processing the queue.
   worker:
-    image: langgenius/dify-api:0.10.1
+    image: langgenius/dify-api:0.10.2
     restart: always
     environment:
       CONSOLE_WEB_URL: ''
@@ -396,7 +396,7 @@ services:
 
   # Frontend web application.
   web:
-    image: langgenius/dify-web:0.10.1
+    image: langgenius/dify-web:0.10.2
     restart: always
     environment:
       # The base URL of console application api server, refers to the Console base URL of WEB service if console domain is
diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index d43bd5e2d1..bf8a8b07e6 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -242,7 +242,7 @@ x-shared-env: &shared-api-worker-env
 services:
   # API service
   api:
-    image: langgenius/dify-api:0.10.1
+    image: langgenius/dify-api:0.10.2
     restart: always
     environment:
       # Use the shared environment variables.
@@ -262,7 +262,7 @@ services:
   # worker service
   # The Celery worker for processing the queue.
   worker:
-    image: langgenius/dify-api:0.10.1
+    image: langgenius/dify-api:0.10.2
     restart: always
     environment:
       # Use the shared environment variables.
@@ -281,7 +281,7 @@ services:
 
   # Frontend web application.
   web:
-    image: langgenius/dify-web:0.10.1
+    image: langgenius/dify-web:0.10.2
     restart: always
     environment:
       CONSOLE_API_URL: ${CONSOLE_API_URL:-}
diff --git a/web/package.json b/web/package.json
index e01603e8d4..04ef26afcd 100644
--- a/web/package.json
+++ b/web/package.json
@@ -1,6 +1,6 @@
 {
   "name": "dify-web",
-  "version": "0.10.1",
+  "version": "0.10.2",
   "private": true,
   "engines": {
     "node": ">=18.17.0"

From de850262b8633a00eefe99333658dbd08156e4bb Mon Sep 17 00:00:00 2001
From: crazywoola <100913391+crazywoola@users.noreply.github.com>
Date: Mon, 28 Oct 2024 19:23:31 +0800
Subject: [PATCH 10/29] fix: button rendering when using streaming (#9957)

---
 web/app/components/base/markdown.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/web/app/components/base/markdown.tsx b/web/app/components/base/markdown.tsx
index 33ff23d3b7..dde4bcf786 100644
--- a/web/app/components/base/markdown.tsx
+++ b/web/app/components/base/markdown.tsx
@@ -252,7 +252,7 @@ const MarkdownButton = ({ node }: any) => {
     className={cn('!h-8 !px-3 select-none')}
     onClick={() => onSend?.(message)}
   >
-    <span className='text-[13px]'>{node.children[0].value}</span>
+    <span className='text-[13px]'>{node.children[0]?.value || ''}</span>
   </Button>
 }
 MarkdownButton.displayName = 'MarkdownButton'

From f47177ecb4c4b36df11c19f0ec866c2c5a162888 Mon Sep 17 00:00:00 2001
From: Jyong <76649700+JohnJyong@users.noreply.github.com>
Date: Mon, 28 Oct 2024 23:04:54 +0800
Subject: [PATCH 11/29] add top_k for es full text search (#9963)

---
 .../rag/datasource/vdb/elasticsearch/elasticsearch_vector.py    | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py b/api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py
index 052a187225..c62042af80 100644
--- a/api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py
+++ b/api/core/rag/datasource/vdb/elasticsearch/elasticsearch_vector.py
@@ -142,7 +142,7 @@ class ElasticSearchVector(BaseVector):
 
     def search_by_full_text(self, query: str, **kwargs: Any) -> list[Document]:
         query_str = {"match": {Field.CONTENT_KEY.value: query}}
-        results = self._client.search(index=self._collection_name, query=query_str)
+        results = self._client.search(index=self._collection_name, query=query_str, size=kwargs.get("top_k", 4))
         docs = []
         for hit in results["hits"]["hits"]:
             docs.append(

From b6d045cebfd610de0d82c954fd75aefa9889a5e9 Mon Sep 17 00:00:00 2001
From: Wu Tianwei <30284043+WTW0313@users.noreply.github.com>
Date: Tue, 29 Oct 2024 09:55:14 +0800
Subject: [PATCH 12/29] fix: Fix page logout issue due to refresh-token (#9970)

---
 web/hooks/use-refresh-token.ts | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/web/hooks/use-refresh-token.ts b/web/hooks/use-refresh-token.ts
index 293f3159de..53dc4faf00 100644
--- a/web/hooks/use-refresh-token.ts
+++ b/web/hooks/use-refresh-token.ts
@@ -41,6 +41,7 @@ const useRefreshToken = () => {
       return new Error('No access token or refresh token found')
     }
     if (localStorage?.getItem('is_refreshing') === '1') {
+      clearTimeout(timer.current)
       timer.current = setTimeout(() => {
         getNewAccessToken()
       }, 1000)
@@ -61,12 +62,14 @@ const useRefreshToken = () => {
       localStorage?.setItem('console_token', access_token)
       localStorage?.setItem('refresh_token', refresh_token)
       const newTokenExpireTime = getExpireTime(access_token)
+      clearTimeout(timer.current)
       timer.current = setTimeout(() => {
         getNewAccessToken()
       }, newTokenExpireTime - advanceTime.current - getCurrentTimeStamp())
     }
     else {
       const newTokenExpireTime = getExpireTime(currentAccessToken)
+      clearTimeout(timer.current)
       timer.current = setTimeout(() => {
         getNewAccessToken()
       }, newTokenExpireTime - advanceTime.current - getCurrentTimeStamp())
@@ -74,8 +77,15 @@ const useRefreshToken = () => {
     return null
   }, [getExpireTime, getCurrentTimeStamp, handleError])
 
+  const handleVisibilityChange = useCallback(() => {
+    if (document.visibilityState === 'visible')
+      getNewAccessToken()
+  }, [])
+
   useEffect(() => {
+    window.addEventListener('visibilitychange', handleVisibilityChange)
     return () => {
+      window.removeEventListener('visibilitychange', handleVisibilityChange)
       clearTimeout(timer.current)
       localStorage?.removeItem('is_refreshing')
     }

From 61ff2fd0f3d5898db093fe31484751058cf5e553 Mon Sep 17 00:00:00 2001
From: ice yao <yao3690093@gmail.com>
Date: Tue, 29 Oct 2024 10:33:00 +0800
Subject: [PATCH 13/29] chore: Enable tencent cos test to run (#9971)

---
 .../unit_tests/oss/__mock/tencent_cos.py      | 81 +++++++++++++++++++
 .../unit_tests/oss/tencent_cos/__init__.py    |  0
 .../oss/tencent_cos/test_tencent_cos.py       | 20 +++++
 .../oss/volcengine_tos/test_volcengine_tos.py |  2 -
 4 files changed, 101 insertions(+), 2 deletions(-)
 create mode 100644 api/tests/unit_tests/oss/__mock/tencent_cos.py
 create mode 100644 api/tests/unit_tests/oss/tencent_cos/__init__.py
 create mode 100644 api/tests/unit_tests/oss/tencent_cos/test_tencent_cos.py

diff --git a/api/tests/unit_tests/oss/__mock/tencent_cos.py b/api/tests/unit_tests/oss/__mock/tencent_cos.py
new file mode 100644
index 0000000000..5189b68e87
--- /dev/null
+++ b/api/tests/unit_tests/oss/__mock/tencent_cos.py
@@ -0,0 +1,81 @@
+import os
+from unittest.mock import MagicMock
+
+import pytest
+from _pytest.monkeypatch import MonkeyPatch
+from qcloud_cos import CosS3Client
+from qcloud_cos.streambody import StreamBody
+
+from tests.unit_tests.oss.__mock.base import (
+    get_example_bucket,
+    get_example_data,
+    get_example_filename,
+    get_example_filepath,
+)
+
+
+class MockTencentCosClass:  # its methods are monkeypatched onto CosS3Client by setup_tencent_cos_mock
+    def __init__(self, conf, retry=1, session=None):  # arguments are accepted but not used
+        self.bucket_name = get_example_bucket()
+        self.key = get_example_filename()
+        self.content = get_example_data()
+        self.filepath = get_example_filepath()
+        self.resp = {  # canned response returned by put_object and delete_object
+            "ETag": "ee8de918d05640145b18f70f4c3aa602",
+            "Server": "tencent-cos",
+            "x-cos-hash-crc64ecma": 16749565679157681890,
+            "x-cos-request-id": "NWU5MDNkYzlfNjRiODJhMDlfMzFmYzhfMTFm****",
+        }
+
+    def put_object(self, Bucket, Body, Key, EnableMD5=False, **kwargs):  # noqa: N803
+        assert Bucket == self.bucket_name
+        assert Key == self.key
+        assert Body == self.content
+        return self.resp
+
+    def get_object(self, Bucket, Key, KeySimplifyCheck=True, **kwargs):  # noqa: N803
+        assert Bucket == self.bucket_name
+        assert Key == self.key
+
+        mock_stream_body = MagicMock(StreamBody)  # StreamBody is passed as the mock's spec
+        mock_raw_stream = MagicMock()
+        mock_stream_body.get_raw_stream.return_value = mock_raw_stream
+        mock_raw_stream.read.return_value = self.content  # whole payload in a single read()
+
+        mock_stream_body.get_stream_to_file = MagicMock()  # no-op: nothing is written to disk
+
+        def chunk_generator(chunk_size=2):  # yields self.content in slices of chunk_size
+            for i in range(0, len(self.content), chunk_size):
+                yield self.content[i : i + chunk_size]
+
+        mock_stream_body.get_stream.return_value = chunk_generator(chunk_size=4096)
+        return {"Body": mock_stream_body}
+
+    def object_exists(self, Bucket, Key):  # noqa: N803
+        assert Bucket == self.bucket_name
+        assert Key == self.key
+        return True
+
+    def delete_object(self, Bucket, Key, **kwargs):  # noqa: N803
+        assert Bucket == self.bucket_name
+        assert Key == self.key
+        self.resp.update({"x-cos-delete-marker": True})  # mutates the shared canned response in place
+        return self.resp
+
+
+MOCK = os.getenv("MOCK_SWITCH", "false").lower() == "true"
+
+
+@pytest.fixture
+def setup_tencent_cos_mock(monkeypatch: MonkeyPatch):
+    if MOCK:  # patch only when the MOCK_SWITCH environment variable is "true"
+        monkeypatch.setattr(CosS3Client, "__init__", MockTencentCosClass.__init__)
+        monkeypatch.setattr(CosS3Client, "put_object", MockTencentCosClass.put_object)
+        monkeypatch.setattr(CosS3Client, "get_object", MockTencentCosClass.get_object)
+        monkeypatch.setattr(CosS3Client, "object_exists", MockTencentCosClass.object_exists)
+        monkeypatch.setattr(CosS3Client, "delete_object", MockTencentCosClass.delete_object)
+
+    yield  # the test body runs here
+
+    if MOCK:
+        monkeypatch.undo()  # restore the original CosS3Client attributes
diff --git a/api/tests/unit_tests/oss/tencent_cos/__init__.py b/api/tests/unit_tests/oss/tencent_cos/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/tests/unit_tests/oss/tencent_cos/test_tencent_cos.py b/api/tests/unit_tests/oss/tencent_cos/test_tencent_cos.py
new file mode 100644
index 0000000000..303f0493bd
--- /dev/null
+++ b/api/tests/unit_tests/oss/tencent_cos/test_tencent_cos.py
@@ -0,0 +1,20 @@
+from unittest.mock import patch
+
+import pytest
+from qcloud_cos import CosConfig
+
+from extensions.storage.tencent_cos_storage import TencentCosStorage
+from tests.unit_tests.oss.__mock.base import (
+    BaseStorageTest,
+    get_example_bucket,
+)
+from tests.unit_tests.oss.__mock.tencent_cos import setup_tencent_cos_mock
+
+
+class TestTencentCos(BaseStorageTest):
+    @pytest.fixture(autouse=True)
+    def setup_method(self, setup_tencent_cos_mock):
+        """Create the storage under test with CosConfig.__init__ stubbed out, using the example bucket."""
+        with patch.object(CosConfig, "__init__", return_value=None):
+            self.storage = TencentCosStorage()
+        self.storage.bucket_name = get_example_bucket()
diff --git a/api/tests/unit_tests/oss/volcengine_tos/test_volcengine_tos.py b/api/tests/unit_tests/oss/volcengine_tos/test_volcengine_tos.py
index 9f8aa158a9..5afbc9e8b4 100644
--- a/api/tests/unit_tests/oss/volcengine_tos/test_volcengine_tos.py
+++ b/api/tests/unit_tests/oss/volcengine_tos/test_volcengine_tos.py
@@ -1,5 +1,3 @@
-from collections.abc import Generator
-
 import pytest
 from tos import TosClientV2
 

From eb698963555be44d8812bd53e6189117550aeeae Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=9D=9E=E6=B3=95=E6=93=8D=E4=BD=9C?= <hjlarry@163.com>
Date: Tue, 29 Oct 2024 10:33:15 +0800
Subject: [PATCH 14/29] fix: allow external knowledge api use simple host
 (#9966)

---
 api/services/external_knowledge_service.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/api/services/external_knowledge_service.py b/api/services/external_knowledge_service.py
index 094772d674..b49738c61c 100644
--- a/api/services/external_knowledge_service.py
+++ b/api/services/external_knowledge_service.py
@@ -70,7 +70,7 @@ class ExternalDatasetService:
 
         endpoint = f"{settings['endpoint']}/retrieval"
         api_key = settings["api_key"]
-        if not validators.url(endpoint):
+        if not validators.url(endpoint, simple_host=True):
             raise ValueError(f"invalid endpoint: {endpoint}")
         try:
             response = httpx.post(endpoint, headers={"Authorization": f"Bearer {api_key}"})

From fc37e654fc26304bed0a1a07bedc23a4e2c68b91 Mon Sep 17 00:00:00 2001
From: crazywoola <100913391+crazywoola@users.noreply.github.com>
Date: Tue, 29 Oct 2024 13:32:50 +0800
Subject: [PATCH 15/29] Feat/support form in conversation (#9980)

---
 .../base/markdown-blocks/button.tsx           |  22 +++
 .../components/base/markdown-blocks/form.tsx  | 137 ++++++++++++++++++
 web/app/components/base/markdown.tsx          |  20 +--
 3 files changed, 162 insertions(+), 17 deletions(-)
 create mode 100644 web/app/components/base/markdown-blocks/button.tsx
 create mode 100644 web/app/components/base/markdown-blocks/form.tsx

diff --git a/web/app/components/base/markdown-blocks/button.tsx b/web/app/components/base/markdown-blocks/button.tsx
new file mode 100644
index 0000000000..56647b3bbe
--- /dev/null
+++ b/web/app/components/base/markdown-blocks/button.tsx
@@ -0,0 +1,22 @@
+import { useChatContext } from '@/app/components/base/chat/chat/context'
+import Button from '@/app/components/base/button'
+import cn from '@/utils/classnames'
+
+const MarkdownButton = ({ node }: any) => { // renders a markdown <button> node as a chat Button
+  const { onSend } = useChatContext()
+  const variant = node.properties.dataVariant
+  const message = node.properties.dataMessage // passed to onSend when the button is clicked
+  const size = node.properties.dataSize
+
+  return <Button
+    variant={variant}
+    size={size}
+    className={cn('!h-8 !px-3 select-none')}
+    onClick={() => onSend?.(message)}
+  >
+    <span className='text-[13px]'>{node.children[0]?.value || ''}</span>
+  </Button>
+}
+MarkdownButton.displayName = 'MarkdownButton'
+
+export default MarkdownButton
diff --git a/web/app/components/base/markdown-blocks/form.tsx b/web/app/components/base/markdown-blocks/form.tsx
new file mode 100644
index 0000000000..f87f2dcd91
--- /dev/null
+++ b/web/app/components/base/markdown-blocks/form.tsx
@@ -0,0 +1,137 @@
+import Button from '@/app/components/base/button'
+import Input from '@/app/components/base/input'
+import Textarea from '@/app/components/base/textarea'
+import { useChatContext } from '@/app/components/base/chat/chat/context'
+
+enum DATA_FORMAT {
+  TEXT = 'text',
+  JSON = 'json',
+}
+enum SUPPORTED_TAGS {
+  LABEL = 'label',
+  INPUT = 'input',
+  TEXTAREA = 'textarea',
+  BUTTON = 'button',
+}
+enum SUPPORTED_TYPES {
+  TEXT = 'text',
+  PASSWORD = 'password',
+  EMAIL = 'email',
+  NUMBER = 'number',
+}
+const MarkdownForm = ({ node }: any) => {
+  // Renders a markdown <form> node. Supported input types: 'text', 'password', 'email', 'number'. Example markup:
+  //   <form data-format="text">
+  //      <label for="username">Username:</label>
+  //      <input type="text" name="username" />
+  //      <label for="password">Password:</label>
+  //      <input type="password" name="password" />
+  //      <label for="content">Content:</label>
+  //      <textarea name="content"></textarea>
+  //      <button data-size="small" data-variant="primary">Login</button>
+  //   </form>
+  const { onSend } = useChatContext()
+
+  const getFormValues = (children: any) => { // maps name -> value for direct input/textarea children
+    const formValues: { [key: string]: any } = {}
+    children.forEach((child: any) => {
+      if (child.tagName === SUPPORTED_TAGS.INPUT)
+        formValues[child.properties.name] = child.properties.value
+      if (child.tagName === SUPPORTED_TAGS.TEXTAREA)
+        formValues[child.properties.name] = child.properties.value
+    })
+    return formValues
+  }
+  const onSubmit = (e: any) => { // sends the values as a JSON string or as "key: value" lines
+    e.preventDefault()
+    const format = node.properties.dataFormat || DATA_FORMAT.TEXT // text is the default format
+    const result = getFormValues(node.children)
+    if (format === DATA_FORMAT.JSON) {
+      onSend?.(JSON.stringify(result))
+    }
+    else {
+      const textResult = Object.entries(result)
+        .map(([key, value]) => `${key}: ${value}`)
+        .join('\n')
+      onSend?.(textResult)
+    }
+  }
+  return (
+    <form
+      autoComplete="off"
+      className='flex flex-col self-stretch'
+      onSubmit={(e: any) => {
+        e.preventDefault()
+        e.stopPropagation()
+      }}
+    >
+      {node.children.filter((i: any) => i.type === 'element').map((child: any, index: number) => {
+        if (child.tagName === SUPPORTED_TAGS.LABEL) {
+          return (
+            <label
+              key={index}
+              htmlFor={child.properties.for}
+              className="my-2 system-md-semibold text-text-secondary"
+            >
+              {child.children[0]?.value || ''}
+            </label>
+          )
+        }
+        if (child.tagName === SUPPORTED_TAGS.INPUT) {
+          if (Object.values(SUPPORTED_TYPES).includes(child.properties.type)) {
+            return (
+              <Input
+                key={index}
+                type={child.properties.type}
+                name={child.properties.name}
+                placeholder={child.properties.placeholder}
+                value={child.properties.value}
+                onChange={(e) => {
+                  e.preventDefault()
+                  child.properties.value = e.target.value // NOTE(review): mutates the AST node; no React state is set
+                }}
+              />
+            )
+          }
+          else {
+            return <p key={index}>Unsupported input type: {child.properties.type}</p>
+          }
+        }
+        if (child.tagName === SUPPORTED_TAGS.TEXTAREA) {
+          return (
+            <Textarea
+              key={index}
+              name={child.properties.name}
+              placeholder={child.properties.placeholder}
+              value={child.properties.value}
+              onChange={(e) => {
+                e.preventDefault()
+                child.properties.value = e.target.value // NOTE(review): mutates the AST node; no React state is set
+              }}
+            />
+          )
+        }
+        if (child.tagName === SUPPORTED_TAGS.BUTTON) {
+          const variant = child.properties.dataVariant
+          const size = child.properties.dataSize
+
+          return (
+            <Button
+              variant={variant}
+              size={size}
+              className='mt-4'
+              key={index}
+              onClick={onSubmit}
+            >
+              <span className='text-[13px]'>{child.children[0]?.value || ''}</span>
+            </Button>
+          )
+        }
+
+        return <p key={index}>Unsupported tag: {child.tagName}</p>
+      })}
+    </form>
+  )
+}
+MarkdownForm.displayName = 'MarkdownForm'
+export default MarkdownForm
diff --git a/web/app/components/base/markdown.tsx b/web/app/components/base/markdown.tsx
index dde4bcf786..58e54123dd 100644
--- a/web/app/components/base/markdown.tsx
+++ b/web/app/components/base/markdown.tsx
@@ -20,7 +20,8 @@ import { useChatContext } from '@/app/components/base/chat/chat/context'
 import VideoGallery from '@/app/components/base/video-gallery'
 import AudioGallery from '@/app/components/base/audio-gallery'
 import SVGRenderer from '@/app/components/base/svg-gallery'
-import Button from '@/app/components/base/button'
+import MarkdownButton from '@/app/components/base/markdown-blocks/button'
+import MarkdownForm from '@/app/components/base/markdown-blocks/form'
 
 // Available language https://github.com/react-syntax-highlighter/react-syntax-highlighter/blob/master/AVAILABLE_LANGUAGES_HLJS.MD
 const capitalizationLanguageNameMap: Record<string, string> = {
@@ -241,22 +242,6 @@ const Link = ({ node, ...props }: any) => {
   }
 }
 
-const MarkdownButton = ({ node }: any) => {
-  const { onSend } = useChatContext()
-  const variant = node.properties.dataVariant
-  const message = node.properties.dataMessage
-  const size = node.properties.dataSize
-
-  return <Button variant={variant}
-    size={size}
-    className={cn('!h-8 !px-3 select-none')}
-    onClick={() => onSend?.(message)}
-  >
-    <span className='text-[13px]'>{node.children[0]?.value || ''}</span>
-  </Button>
-}
-MarkdownButton.displayName = 'MarkdownButton'
-
 export function Markdown(props: { content: string; className?: string }) {
   const latexContent = preprocessLaTeX(props.content)
   return (
@@ -289,6 +274,7 @@ export function Markdown(props: { content: string; className?: string }) {
           a: Link,
           p: Paragraph,
           button: MarkdownButton,
+          form: MarkdownForm,
         }}
         linkTarget='_blank'
       >

From c8ef9223e5a671d29ac8cfd0f79aea91ddf4354a Mon Sep 17 00:00:00 2001
From: roadgoat19 <123213767+roadgoat19@users.noreply.github.com>
Date: Tue, 29 Oct 2024 03:00:23 -0400
Subject: [PATCH 16/29] feat: couchbase integration (#6165)

Co-authored-by: crazywoola <427733928@qq.com>
Co-authored-by: Elliot Scribner <elliot.scribner@couchbase.com>
Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
Co-authored-by: Bowen Liang <bowenliang@apache.org>
---
 .github/workflows/api-tests.yml               |   3 +-
 .github/workflows/expose_service_ports.sh     |   4 +-
 .gitignore                                    |   3 +-
 api/.env.example                              |   9 +-
 api/commands.py                               |   1 +
 api/configs/middleware/__init__.py            |   2 +
 .../middleware/vdb/couchbase_config.py        |  34 ++
 api/controllers/console/datasets/datasets.py  |   2 +
 .../rag/datasource/vdb/couchbase/__init__.py  |   0
 .../vdb/couchbase/couchbase_vector.py         | 378 ++++++++++++++++++
 api/core/rag/datasource/vdb/vector_factory.py |   4 +
 api/core/rag/datasource/vdb/vector_type.py    |   1 +
 api/poetry.lock                               |  55 ++-
 api/pyproject.toml                            |   1 +
 .../vdb/couchbase/__init__.py                 |   0
 .../vdb/couchbase/test_couchbase.py           |  50 +++
 dev/pytest/pytest_vdb.sh                      |   3 +-
 docker/.env.example                           |  10 +-
 docker/couchbase-server/Dockerfile            |   4 +
 docker/couchbase-server/init-cbserver.sh      |  44 ++
 docker/docker-compose.yaml                    |  38 ++
 21 files changed, 639 insertions(+), 7 deletions(-)
 create mode 100644 api/configs/middleware/vdb/couchbase_config.py
 create mode 100644 api/core/rag/datasource/vdb/couchbase/__init__.py
 create mode 100644 api/core/rag/datasource/vdb/couchbase/couchbase_vector.py
 create mode 100644 api/tests/integration_tests/vdb/couchbase/__init__.py
 create mode 100644 api/tests/integration_tests/vdb/couchbase/test_couchbase.py
 create mode 100644 docker/couchbase-server/Dockerfile
 create mode 100755 docker/couchbase-server/init-cbserver.sh

diff --git a/.github/workflows/api-tests.yml b/.github/workflows/api-tests.yml
index e9c2b7b086..c87d5a4dd4 100644
--- a/.github/workflows/api-tests.yml
+++ b/.github/workflows/api-tests.yml
@@ -78,7 +78,7 @@ jobs:
       - name: Run Workflow
         run: poetry run -C api bash dev/pytest/pytest_workflow.sh
 
-      - name: Set up Vector Stores (Weaviate, Qdrant, PGVector, Milvus, PgVecto-RS, Chroma, MyScale, ElasticSearch)
+      - name: Set up Vector Stores (Weaviate, Qdrant, PGVector, Milvus, PgVecto-RS, Chroma, MyScale, ElasticSearch, Couchbase)
         uses: hoverkraft-tech/compose-action@v2.0.0
         with:
           compose-file: |
@@ -86,6 +86,7 @@ jobs:
           services: |
             weaviate
             qdrant
+            couchbase-server
             etcd
             minio
             milvus-standalone
diff --git a/.github/workflows/expose_service_ports.sh b/.github/workflows/expose_service_ports.sh
index ae3e0ee69d..bc65c19a91 100755
--- a/.github/workflows/expose_service_ports.sh
+++ b/.github/workflows/expose_service_ports.sh
@@ -7,5 +7,7 @@ yq eval '.services["milvus-standalone"].ports += ["19530:19530"]' -i docker/dock
 yq eval '.services.pgvector.ports += ["5433:5432"]' -i docker/docker-compose.yaml
 yq eval '.services["pgvecto-rs"].ports += ["5431:5432"]' -i docker/docker-compose.yaml
 yq eval '.services["elasticsearch"].ports += ["9200:9200"]' -i docker/docker-compose.yaml
+yq eval '.services["couchbase-server"].ports += ["8091-8096:8091-8096"]' -i docker/docker-compose.yaml
+yq eval '.services["couchbase-server"].ports += ["11210:11210"]' -i docker/docker-compose.yaml
 
-echo "Ports exposed for sandbox, weaviate, qdrant, chroma, milvus, pgvector, pgvecto-rs, elasticsearch"
\ No newline at end of file
+echo "Ports exposed for sandbox, weaviate, qdrant, chroma, milvus, pgvector, pgvecto-rs, elasticsearch, couchbase"
diff --git a/.gitignore b/.gitignore
index 27cf8a4ba3..29a80534f7 100644
--- a/.gitignore
+++ b/.gitignore
@@ -173,6 +173,7 @@ docker/volumes/myscale/log/*
 docker/volumes/unstructured/*
 docker/volumes/pgvector/data/*
 docker/volumes/pgvecto_rs/data/*
+docker/volumes/couchbase/*
 
 docker/nginx/conf.d/default.conf
 docker/nginx/ssl/*
@@ -189,4 +190,4 @@ pyrightconfig.json
 api/.vscode
 
 .idea/
-.vscode
\ No newline at end of file
+.vscode
diff --git a/api/.env.example b/api/.env.example
index 184a811c51..2ce425338e 100644
--- a/api/.env.example
+++ b/api/.env.example
@@ -120,7 +120,7 @@ SUPABASE_URL=your-server-url
 WEB_API_CORS_ALLOW_ORIGINS=http://127.0.0.1:3000,*
 CONSOLE_CORS_ALLOW_ORIGINS=http://127.0.0.1:3000,*
 
-# Vector database configuration, support: weaviate, qdrant, milvus, myscale, relyt, pgvecto_rs, pgvector, pgvector, chroma, opensearch, tidb_vector, vikingdb, upstash
+# Vector database configuration, support: weaviate, qdrant, milvus, myscale, relyt, pgvecto_rs, pgvector, chroma, opensearch, tidb_vector, couchbase, vikingdb, upstash
 VECTOR_STORE=weaviate
 
 # Weaviate configuration
@@ -136,6 +136,13 @@ QDRANT_CLIENT_TIMEOUT=20
 QDRANT_GRPC_ENABLED=false
 QDRANT_GRPC_PORT=6334
 
+# Couchbase configuration
+COUCHBASE_CONNECTION_STRING=127.0.0.1
+COUCHBASE_USER=Administrator
+COUCHBASE_PASSWORD=password
+COUCHBASE_BUCKET_NAME=Embeddings
+COUCHBASE_SCOPE_NAME=_default
+
 # Milvus configuration
 MILVUS_URI=http://127.0.0.1:19530
 MILVUS_TOKEN=
diff --git a/api/commands.py b/api/commands.py
index 720a4447da..da09f1b610 100644
--- a/api/commands.py
+++ b/api/commands.py
@@ -278,6 +278,7 @@ def migrate_knowledge_vector_database():
         VectorType.BAIDU,
         VectorType.VIKINGDB,
         VectorType.UPSTASH,
+        VectorType.COUCHBASE,
     }
     page = 1
     while True:
diff --git a/api/configs/middleware/__init__.py b/api/configs/middleware/__init__.py
index 3d68e29d0e..e8f6ba91b6 100644
--- a/api/configs/middleware/__init__.py
+++ b/api/configs/middleware/__init__.py
@@ -17,6 +17,7 @@ from configs.middleware.storage.tencent_cos_storage_config import TencentCloudCO
 from configs.middleware.storage.volcengine_tos_storage_config import VolcengineTOSStorageConfig
 from configs.middleware.vdb.analyticdb_config import AnalyticdbConfig
 from configs.middleware.vdb.chroma_config import ChromaConfig
+from configs.middleware.vdb.couchbase_config import CouchbaseConfig
 from configs.middleware.vdb.elasticsearch_config import ElasticsearchConfig
 from configs.middleware.vdb.milvus_config import MilvusConfig
 from configs.middleware.vdb.myscale_config import MyScaleConfig
@@ -251,6 +252,7 @@ class MiddlewareConfig(
     TiDBVectorConfig,
     WeaviateConfig,
     ElasticsearchConfig,
+    CouchbaseConfig,
     InternalTestConfig,
     VikingDBConfig,
     UpstashConfig,
diff --git a/api/configs/middleware/vdb/couchbase_config.py b/api/configs/middleware/vdb/couchbase_config.py
new file mode 100644
index 0000000000..391089ec6e
--- /dev/null
+++ b/api/configs/middleware/vdb/couchbase_config.py
@@ -0,0 +1,34 @@
+from typing import Optional
+
+from pydantic import BaseModel, Field
+
+
+class CouchbaseConfig(BaseModel):
+    """
+    Couchbase vector store settings; every field is optional and defaults to None.
+    """
+
+    COUCHBASE_CONNECTION_STRING: Optional[str] = Field(
+        description="COUCHBASE connection string",
+        default=None,
+    )
+
+    COUCHBASE_USER: Optional[str] = Field(
+        description="COUCHBASE user",
+        default=None,
+    )
+
+    COUCHBASE_PASSWORD: Optional[str] = Field(
+        description="COUCHBASE password",
+        default=None,
+    )
+
+    COUCHBASE_BUCKET_NAME: Optional[str] = Field(
+        description="COUCHBASE bucket name",
+        default=None,
+    )
+
+    COUCHBASE_SCOPE_NAME: Optional[str] = Field(
+        description="COUCHBASE scope name",
+        default=None,
+    )
diff --git a/api/controllers/console/datasets/datasets.py b/api/controllers/console/datasets/datasets.py
index c8022efb8b..854821746a 100644
--- a/api/controllers/console/datasets/datasets.py
+++ b/api/controllers/console/datasets/datasets.py
@@ -640,6 +640,7 @@ class DatasetRetrievalSettingApi(Resource):
                 | VectorType.ELASTICSEARCH
                 | VectorType.PGVECTOR
                 | VectorType.TIDB_ON_QDRANT
+                | VectorType.COUCHBASE
             ):
                 return {
                     "retrieval_method": [
@@ -678,6 +679,7 @@ class DatasetRetrievalSettingMockApi(Resource):
                 | VectorType.MYSCALE
                 | VectorType.ORACLE
                 | VectorType.ELASTICSEARCH
+                | VectorType.COUCHBASE
                 | VectorType.PGVECTOR
             ):
                 return {
diff --git a/api/core/rag/datasource/vdb/couchbase/__init__.py b/api/core/rag/datasource/vdb/couchbase/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/core/rag/datasource/vdb/couchbase/couchbase_vector.py b/api/core/rag/datasource/vdb/couchbase/couchbase_vector.py
new file mode 100644
index 0000000000..3f88d2ca2b
--- /dev/null
+++ b/api/core/rag/datasource/vdb/couchbase/couchbase_vector.py
@@ -0,0 +1,378 @@
+import json
+import logging
+import time
+import uuid
+from datetime import timedelta
+from typing import Any
+
+from couchbase import search
+from couchbase.auth import PasswordAuthenticator
+from couchbase.cluster import Cluster
+from couchbase.management.search import SearchIndex
+
+# needed for options -- cluster, timeout, SQL++ (N1QL) query, etc.
+from couchbase.options import ClusterOptions, SearchOptions
+from couchbase.vector_search import VectorQuery, VectorSearch
+from flask import current_app
+from pydantic import BaseModel, model_validator
+
+from core.rag.datasource.vdb.vector_base import BaseVector
+from core.rag.datasource.vdb.vector_factory import AbstractVectorFactory
+from core.rag.datasource.vdb.vector_type import VectorType
+from core.rag.embedding.embedding_base import Embeddings
+from core.rag.models.document import Document
+from extensions.ext_redis import redis_client
+from models.dataset import Dataset
+
+logger = logging.getLogger(__name__)
+
+
+class CouchbaseConfig(BaseModel):
+    """Connection settings required to reach a Couchbase bucket and scope."""
+
+    connection_string: str
+    user: str
+    password: str
+    bucket_name: str
+    scope_name: str
+
+    @model_validator(mode="before")
+    @classmethod
+    def validate_config(cls, values: dict) -> dict:
+        """Reject missing or empty settings, naming the offending environment variable.
+
+        Raises:
+            ValueError: if any field is absent or falsy.
+        """
+        for field_name in ("connection_string", "user", "password", "bucket_name", "scope_name"):
+            if not values.get(field_name):
+                raise ValueError(f"config COUCHBASE_{field_name.upper()} is required")
+        return values
+
+
+class CouchbaseVector(BaseVector):
+    def __init__(self, collection_name: str, config: CouchbaseConfig):
+        """Connect to the Couchbase cluster and bind the configured bucket and scope."""
+        super().__init__(collection_name)
+        self._client_config = config
+        self._bucket_name = config.bucket_name
+        self._scope_name = config.scope_name
+
+        # Authenticate with the username/password taken from the config.
+        auth = PasswordAuthenticator(config.user, config.password)
+        options = ClusterOptions(auth)
+        self._cluster = Cluster(config.connection_string, options)
+        self._bucket = self._cluster.bucket(config.bucket_name)
+        self._scope = self._bucket.scope(config.scope_name)
+
+        # Wait until the cluster is ready for use.
+        self._cluster.wait_until_ready(timedelta(seconds=5))
+
+    def create(self, texts: list[Document], embeddings: list[list[float]], **kwargs):
+        # Dash-free UUID for the index definition; vector length is taken from the first embedding.
+        self._create_collection(uuid=uuid.uuid4().hex, vector_length=len(embeddings[0]))
+        self.add_texts(texts, embeddings)
+
+    def _create_collection(self, vector_length: int, uuid: str):  # create collection + search index once
+        lock_name = "vector_indexing_lock_{}".format(self._collection_name)
+        with redis_client.lock(lock_name, timeout=20):  # serialize creation per collection name
+            collection_exist_cache_key = "vector_indexing_{}".format(self._collection_name)
+            if redis_client.get(collection_exist_cache_key):  # cache entry written at the end of this method
+                return
+            if self._collection_exists(self._collection_name):
+                return
+            manager = self._bucket.collections()
+            manager.create_collection(self._client_config.scope_name, self._collection_name)
+            # Search indexes are obtained from the scope object.
+            index_manager = self._scope.search_indexes()
+            # Template index definition; name, uuid, dims and the type-mapping key are overwritten below.
+            index_definition = json.loads("""
+{
+    "type": "fulltext-index",
+    "name": "Embeddings._default.Vector_Search",
+    "uuid": "26d4db528e78b716",
+    "sourceType": "gocbcore",
+    "sourceName": "Embeddings",
+    "sourceUUID": "2242e4a25b4decd6650c9c7b3afa1dbf",
+    "planParams": {
+      "maxPartitionsPerPIndex": 1024,
+      "indexPartitions": 1
+    },
+    "params": {
+      "doc_config": {
+        "docid_prefix_delim": "",
+        "docid_regexp": "",
+        "mode": "scope.collection.type_field",
+        "type_field": "type"
+      },
+      "mapping": {
+        "analysis": { },
+        "default_analyzer": "standard",
+        "default_datetime_parser": "dateTimeOptional",
+        "default_field": "_all",
+        "default_mapping": {
+          "dynamic": true,
+          "enabled": true
+        },
+        "default_type": "_default",
+        "docvalues_dynamic": false,
+        "index_dynamic": true,
+        "store_dynamic": true,
+        "type_field": "_type",
+        "types": {
+          "collection_name": {
+            "dynamic": true,
+            "enabled": true,
+            "properties": {
+              "embedding": {
+                "dynamic": false,
+                "enabled": true,
+                "fields": [
+                  {
+                    "dims": 1536,
+                    "index": true,
+                    "name": "embedding",
+                    "similarity": "dot_product",
+                    "type": "vector",
+                    "vector_index_optimized_for": "recall"
+                  }
+                ]
+              },
+              "metadata": {
+                "dynamic": true,
+                "enabled": true
+              },
+              "text": {
+                "dynamic": false,
+                "enabled": true,
+                "fields": [
+                  {
+                    "index": true,
+                    "name": "text",
+                    "store": true,
+                    "type": "text"
+                  }
+                ]
+              }
+            }
+          }
+        }
+      },
+      "store": {
+        "indexType": "scorch",
+        "segmentVersion": 16
+      }
+    },
+    "sourceParams": { }
+  }
+""")
+            index_definition["name"] = self._collection_name + "_search"
+            index_definition["uuid"] = uuid  # NOTE(review): not passed to SearchIndex below — confirm it is needed
+            index_definition["params"]["mapping"]["types"]["collection_name"]["properties"]["embedding"]["fields"][0][
+                "dims"
+            ] = vector_length
+            index_definition["params"]["mapping"]["types"][self._scope_name + "." + self._collection_name] = (
+                index_definition["params"]["mapping"]["types"].pop("collection_name")
+            )  # re-key the placeholder mapping as "<scope>.<collection>"
+            time.sleep(2)  # NOTE(review): presumably waits for the new collection to be usable — confirm
+            index_manager.upsert_index(
+                SearchIndex(
+                    index_definition["name"],
+                    params=index_definition["params"],
+                    source_name=self._bucket_name,
+                ),
+            )
+            time.sleep(1)  # NOTE(review): presumably gives the index time to register — confirm
+            # Cache for one hour that the collection and index were created.
+            redis_client.set(collection_exist_cache_key, 1, ex=3600)
+
+    def _collection_exists(self, name: str):
+        """Return True if a collection called ``name`` exists in the configured scope.
+
+        A scope that is missing from the bucket is treated as containing no
+        collections instead of raising ``KeyError``.
+        """
+        # Map every scope in the bucket to the names of its collections.
+        scope_collection_map: dict[str, Any] = {
+            scope.name: [collection.name for collection in scope.collections]
+            for scope in self._bucket.collections().get_all_scopes()
+        }
+
+        return name in scope_collection_map.get(self._scope_name, [])
+
+    def get_type(self) -> str:
+        return VectorType.COUCHBASE  # the VectorType member for this backend
+
+    def add_texts(self, documents: list[Document], embeddings: list[list[float]], **kwargs):
+        """Upsert each document with its embedding and return the document ids used.
+
+        Ids come from ``self._get_uuids(documents)``; every document is stored as
+        ``{"text", "embedding", "metadata"}`` in this vector's collection.
+        """
+        uuids = self._get_uuids(documents)
+        # Resolve the collection once instead of on every iteration.
+        collection = self._scope.collection(self._collection_name)
+
+        for doc_id, document, vector in zip(uuids, documents, embeddings):
+            collection.upsert(
+                doc_id,
+                {"text": document.page_content, "embedding": vector, "metadata": document.metadata},
+            )
+
+        return list(uuids)
+
+    def text_exists(self, id: str) -> bool:
+        """Return True when a document whose key equals ``id`` exists in the collection."""
+        # The id travels as the named parameter $doc_id rather than being interpolated.
+        query = f"""
+                SELECT COUNT(1) AS count FROM
+                `{self._client_config.bucket_name}`.{self._client_config.scope_name}.{self._collection_name}
+                WHERE META().id = $doc_id
+                """
+        rows = self._cluster.query(query, named_parameters={"doc_id": id}).execute()
+        # Only the first row matters; no rows at all means the document is absent.
+        first_row = next(iter(rows), None)
+        return first_row["count"] > 0 if first_row is not None else False
+
+    def delete_by_ids(self, ids: list[str]) -> None:
+        """Best-effort delete of the documents whose keys are in ``ids``; failures are logged, not raised."""
+        query = f"""
+            DELETE FROM `{self._bucket_name}`.{self._client_config.scope_name}.{self._collection_name}
+            WHERE META().id IN $doc_ids;
+            """
+        try:
+            self._cluster.query(query, named_parameters={"doc_ids": ids}).execute()
+        except Exception:
+            logger.exception("Failed to delete documents by ids from Couchbase collection %s", self._collection_name)
+    def delete_by_document_id(self, document_id: str) -> None:  # delete the document stored under this key
+        query = f"""
+                DELETE FROM
+                `{self._client_config.bucket_name}`.{self._client_config.scope_name}.{self._collection_name}
+                WHERE META().id = $doc_id;
+                """
+        self._cluster.query(query, named_parameters={"doc_id": document_id}).execute()  # id bound as $doc_id
+
+    # def get_ids_by_metadata_field(self, key: str, value: str):
+    #     query = f"""
+    #         SELECT id FROM
+    #         `{self._client_config.bucket_name}`.{self._client_config.scope_name}.{self._collection_name}
+    #         WHERE `metadata.{key}` = $value;
+    #         """
+    #     result = self._cluster.query(query, named_parameters={'value':value})
+    #     return [row['id'] for row in result.rows()]
+
+    def delete_by_metadata_field(self, key: str, value: str) -> None:  # key is interpolated; only value is bound
+        query = f"""
+            DELETE FROM `{self._client_config.bucket_name}`.{self._client_config.scope_name}.{self._collection_name}
+            WHERE metadata.{key} = $value;
+            """
+        self._cluster.query(query, named_parameters={"value": value}).execute()
+
+    def search_by_vector(self, query_vector: list[float], **kwargs: Any) -> list[Document]:
+        """Return up to ``top_k`` documents nearest to ``query_vector``.
+
+        Keyword args: ``top_k`` (default 5) and ``score_threshold`` (default 0.0);
+        hits scoring below the threshold are dropped.
+
+        Raises:
+            ValueError: if the search fails; the original error is chained.
+        """
+        top_k = kwargs.get("top_k", 5)
+        score_threshold = kwargs.get("score_threshold") or 0.0
+
+        search_req = search.SearchRequest.create(
+            VectorSearch.from_vector_query(VectorQuery("embedding", query_vector, top_k))
+        )
+        docs = []
+        try:
+            search_iter = self._scope.search(
+                self._collection_name + "_search",
+                search_req,
+                SearchOptions(limit=top_k, collections=[self._collection_name], fields=["*"]),
+            )
+            for row in search_iter.rows():
+                score = row.score
+                if score < score_threshold:
+                    continue  # skip before building a Document that would be discarded
+                text = row.fields.pop("text")
+                metadata = self._format_metadata(row.fields)
+                metadata["score"] = score
+                docs.append(Document(page_content=text, metadata=metadata))
+        except Exception as e:
+            raise ValueError(f"Search failed with error: {e}") from e
+
+        return docs
+
+    def search_by_full_text(self, query: str, **kwargs: Any) -> list[Document]:
+        """Return up to ``top_k`` (default 2) documents whose ``text`` field matches ``query``.
+
+        Raises:
+            ValueError: if the search fails; the original error is chained.
+        """
+        top_k = kwargs.get("top_k", 2)
+        docs = []
+        try:
+            search_req = search.SearchRequest.create(search.QueryStringQuery("text:" + query))
+            search_iter = self._scope.search(
+                self._collection_name + "_search", search_req, SearchOptions(limit=top_k, fields=["*"])
+            )
+            for row in search_iter.rows():
+                text = row.fields.pop("text")
+                metadata = self._format_metadata(row.fields)
+                metadata["score"] = row.score
+                docs.append(Document(page_content=text, metadata=metadata))
+        except Exception as e:
+            raise ValueError(f"Search failed with error: {e}") from e
+        return docs
+
+    def delete(self):
+        """Drop this vector's collection from the configured scope, if it exists there."""
+        manager = self._bucket.collections()
+        for scope in manager.get_all_scopes():
+            # Look only at the configured scope and drop from it, rather than assuming "_default".
+            if scope.name == self._scope_name:
+                if any(c.name == self._collection_name for c in scope.collections):
+                    manager.drop_collection(self._scope_name, self._collection_name)
+
+    def _format_metadata(self, row_fields: dict[str, Any]) -> dict[str, Any]:
+        """Helper method to format the metadata from the Couchbase Search API.
+
+        Couchbase Search returns metadata keys prefixed with ``metadata.``; only
+        that leading prefix is removed, so a key such as
+        ``metadata.a.metadata.b`` becomes ``a.metadata.b``. Keys without the
+        prefix are kept unchanged.
+
+        Args:
+            row_fields (Dict[str, Any]): The fields to format.
+
+        Returns:
+            Dict[str, Any]: The formatted metadata.
+        """
+        # str.removeprefix strips at most one leading occurrence and is a no-op
+        # for keys that do not start with the prefix.
+        prefix = "metadata."
+
+        return {key.removeprefix(prefix): value for key, value in row_fields.items()}
+
+
+class CouchbaseVectorFactory(AbstractVectorFactory):
+    def init_vector(self, dataset: Dataset, attributes: list, embeddings: Embeddings) -> CouchbaseVector:
+        """Create a CouchbaseVector for ``dataset`` using the Flask app's COUCHBASE_* settings."""
+        index_struct = dataset.index_struct_dict
+        if index_struct:
+            # Reuse the collection name already stored in the dataset's index struct.
+            collection_name = index_struct["vector_store"]["class_prefix"]
+        else:
+            collection_name = Dataset.gen_collection_name_by_id(dataset.id)
+            dataset.index_struct = json.dumps(self.gen_index_struct_dict(VectorType.COUCHBASE, collection_name))
+
+        settings = current_app.config
+        couchbase_config = CouchbaseConfig(
+            connection_string=settings.get("COUCHBASE_CONNECTION_STRING"),
+            user=settings.get("COUCHBASE_USER"),
+            password=settings.get("COUCHBASE_PASSWORD"),
+            bucket_name=settings.get("COUCHBASE_BUCKET_NAME"),
+            scope_name=settings.get("COUCHBASE_SCOPE_NAME"),
+        )
+
+        return CouchbaseVector(collection_name=collection_name, config=couchbase_config)
diff --git a/api/core/rag/datasource/vdb/vector_factory.py b/api/core/rag/datasource/vdb/vector_factory.py
index 59a5aadacd..87d19bf60b 100644
--- a/api/core/rag/datasource/vdb/vector_factory.py
+++ b/api/core/rag/datasource/vdb/vector_factory.py
@@ -114,6 +114,10 @@ class Vector:
                 from core.rag.datasource.vdb.analyticdb.analyticdb_vector import AnalyticdbVectorFactory
 
                 return AnalyticdbVectorFactory
+            case VectorType.COUCHBASE:
+                from core.rag.datasource.vdb.couchbase.couchbase_vector import CouchbaseVectorFactory
+
+                return CouchbaseVectorFactory
             case VectorType.BAIDU:
                 from core.rag.datasource.vdb.baidu.baidu_vector import BaiduVectorFactory
 
diff --git a/api/core/rag/datasource/vdb/vector_type.py b/api/core/rag/datasource/vdb/vector_type.py
index 3b6df94f78..7384c12ff7 100644
--- a/api/core/rag/datasource/vdb/vector_type.py
+++ b/api/core/rag/datasource/vdb/vector_type.py
@@ -16,6 +16,7 @@ class VectorType(str, Enum):
     TENCENT = "tencent"
     ORACLE = "oracle"
     ELASTICSEARCH = "elasticsearch"
+    COUCHBASE = "couchbase"
     BAIDU = "baidu"
     VIKINGDB = "vikingdb"
     UPSTASH = "upstash"
diff --git a/api/poetry.lock b/api/poetry.lock
index 618dbb4033..e1e5a6410b 100644
--- a/api/poetry.lock
+++ b/api/poetry.lock
@@ -1801,6 +1801,46 @@ requests = ">=2.8"
 six = "*"
 xmltodict = "*"
 
+[[package]]
+name = "couchbase"
+version = "4.3.3"
+description = "Python Client for Couchbase"
+optional = false
+python-versions = ">=3.7"
+files = [
+    {file = "couchbase-4.3.3-cp310-cp310-macosx_10_15_x86_64.whl", hash = "sha256:d8069e4f01332859d56cca597874645c914699162b3979d1b432f0dfc186b124"},
+    {file = "couchbase-4.3.3-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:1caa6cfef49c785b35b1702102f718227f351df87bba2694b9334520c41e9eb5"},
+    {file = "couchbase-4.3.3-cp310-cp310-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:f4a9a65c44935249fa078fb90a3c28ea71da9d2d5889fcd514b12d0538010ae0"},
+    {file = "couchbase-4.3.3-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:4f144b8c482c18283d8e419b844630d41f3249b07d43d40b5e3535444e57d0fb"},
+    {file = "couchbase-4.3.3-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:1c534fba6fdc7cf47eed9dee8a57d1e9eb867bf008574e321fa380a77cebf32f"},
+    {file = "couchbase-4.3.3-cp310-cp310-win_amd64.whl", hash = "sha256:b841be06e0e4370b69ebef6bca3409c378186f7d6e964cd645ba18e97216c022"},
+    {file = "couchbase-4.3.3-cp311-cp311-macosx_10_15_x86_64.whl", hash = "sha256:eee7a73b3acbdc78ae314fddf7f975b3c9e05df07df255f4dcc878939a2abae0"},
+    {file = "couchbase-4.3.3-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:53417cafcf90ff4e2fd81ebba2a08b7ad56f17160d1c5019ad3b09c758aeb363"},
+    {file = "couchbase-4.3.3-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:0cefd13bea8b0f150f1b9d27fd7614f971f77419b31817781d26ba315ed658bb"},
+    {file = "couchbase-4.3.3-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:78fa1054d7740e2fe38fce0a2aab4e9a2d30263d894e0615ee5df297f02f59a3"},
+    {file = "couchbase-4.3.3-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:eb093899cfad5a7472258a9b6a57775dbf23a6e0180241507ba89ce3ab241e41"},
+    {file = "couchbase-4.3.3-cp311-cp311-win_amd64.whl", hash = "sha256:f7cfbdc699af5715f49365ffbb05a6a7366a534c0d7161edf270ad3e735a6c5d"},
+    {file = "couchbase-4.3.3-cp312-cp312-macosx_10_15_x86_64.whl", hash = "sha256:58352cae9b8affdaa2ac012e0a03c8c2632ee6297a878232888b4e0360d0d5df"},
+    {file = "couchbase-4.3.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:728e7e3b5e1682706cb9d63993d289226d02a25089527b8ecb4e3889dabc38cf"},
+    {file = "couchbase-4.3.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:73014bf098cf14187a39cc13453e0d859c1d54568df28f69cc308a9a5f24feb2"},
+    {file = "couchbase-4.3.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:a743375804068ae01b73c916bfca738764c8c12f381bb399ef04e784935856a1"},
+    {file = "couchbase-4.3.3-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:394c122cfe02a76a99e7d5178e64129f6da49843225e78d8629abcab556c24af"},
+    {file = "couchbase-4.3.3-cp312-cp312-win_amd64.whl", hash = "sha256:bf85d7a5cda548d9801614651206068b4445fa37972e62b14d7521a958198693"},
+    {file = "couchbase-4.3.3-cp38-cp38-macosx_10_15_x86_64.whl", hash = "sha256:92d23c9cedd571631070791f2afee0e3d7d8c9ce1bf2ea6e9a4f2fdbc37a0f1e"},
+    {file = "couchbase-4.3.3-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:38c42eb29a73cce2998ae5df45bd61b16dce9765d3bff968ec5cf6a622faa291"},
+    {file = "couchbase-4.3.3-cp38-cp38-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:afed137bf0edc642d7b201b6ab7b1e7117bb4c8eac6b2f253cc6e106f334a2a1"},
+    {file = "couchbase-4.3.3-cp38-cp38-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:954d991377d47883aaf903934c5d0f19577680a2abf80d3ce5bb9b3c80991fc7"},
+    {file = "couchbase-4.3.3-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:d5552b9fa684630698dc98d6f3b1082540634c1b7ad5bf53b843b5da57b0169c"},
+    {file = "couchbase-4.3.3-cp38-cp38-win_amd64.whl", hash = "sha256:f88f2b7e0c894f7237d9f3fb5c46abc44b8151a97b3ca8e75f57d23ebf59f9da"},
+    {file = "couchbase-4.3.3-cp39-cp39-macosx_10_15_x86_64.whl", hash = "sha256:769e1e2367ea1d4de181fcd4b4e353e9abef97d15b581a6c5aea49ece3dc7d59"},
+    {file = "couchbase-4.3.3-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:47f59a0b35ffce060583fd11f98f049f3b70701cf14aab9ac092594aca486aeb"},
+    {file = "couchbase-4.3.3-cp39-cp39-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:440bb93d611827ba0ea2403c6f204fe931467a6cb5811f0e03bf1779204ef843"},
+    {file = "couchbase-4.3.3-cp39-cp39-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:cdb4dde62e1d41c0b8707121ab68fa78b7a1508541bd48fc850be396f91bc8d9"},
+    {file = "couchbase-4.3.3-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:7f8cf45f317b39cc19db5c67b565662f08d6c90305b3aa14e04bc22707258213"},
+    {file = "couchbase-4.3.3-cp39-cp39-win_amd64.whl", hash = "sha256:c97d48ad486c8f201b4482d5594258f949369cb44792ed148d5159a3d12ae21b"},
+    {file = "couchbase-4.3.3.tar.gz", hash = "sha256:27808500551564b39b46943cf3daab572694889c1eb638425d363edb48b20da7"},
+]
+
 [[package]]
 name = "coverage"
 version = "7.2.7"
@@ -6850,6 +6890,19 @@ files = [
     {file = "pyarrow-17.0.0-cp312-cp312-win_amd64.whl", hash = "sha256:392bc9feabc647338e6c89267635e111d71edad5fcffba204425a7c8d13610d7"},
     {file = "pyarrow-17.0.0-cp38-cp38-macosx_10_15_x86_64.whl", hash = "sha256:af5ff82a04b2171415f1410cff7ebb79861afc5dae50be73ce06d6e870615204"},
     {file = "pyarrow-17.0.0-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:edca18eaca89cd6382dfbcff3dd2d87633433043650c07375d095cd3517561d8"},
+    {file = "pyarrow-17.0.0-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:7c7916bff914ac5d4a8fe25b7a25e432ff921e72f6f2b7547d1e325c1ad9d155"},
+    {file = "pyarrow-17.0.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f553ca691b9e94b202ff741bdd40f6ccb70cdd5fbf65c187af132f1317de6145"},
+    {file = "pyarrow-17.0.0-cp38-cp38-manylinux_2_28_aarch64.whl", hash = "sha256:0cdb0e627c86c373205a2f94a510ac4376fdc523f8bb36beab2e7f204416163c"},
+    {file = "pyarrow-17.0.0-cp38-cp38-manylinux_2_28_x86_64.whl", hash = "sha256:d7d192305d9d8bc9082d10f361fc70a73590a4c65cf31c3e6926cd72b76bc35c"},
+    {file = "pyarrow-17.0.0-cp38-cp38-win_amd64.whl", hash = "sha256:02dae06ce212d8b3244dd3e7d12d9c4d3046945a5933d28026598e9dbbda1fca"},
+    {file = "pyarrow-17.0.0-cp39-cp39-macosx_10_15_x86_64.whl", hash = "sha256:13d7a460b412f31e4c0efa1148e1d29bdf18ad1411eb6757d38f8fbdcc8645fb"},
+    {file = "pyarrow-17.0.0-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:9b564a51fbccfab5a04a80453e5ac6c9954a9c5ef2890d1bcf63741909c3f8df"},
+    {file = "pyarrow-17.0.0-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:32503827abbc5aadedfa235f5ece8c4f8f8b0a3cf01066bc8d29de7539532687"},
+    {file = "pyarrow-17.0.0-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a155acc7f154b9ffcc85497509bcd0d43efb80d6f733b0dc3bb14e281f131c8b"},
+    {file = "pyarrow-17.0.0-cp39-cp39-manylinux_2_28_aarch64.whl", hash = "sha256:dec8d129254d0188a49f8a1fc99e0560dc1b85f60af729f47de4046015f9b0a5"},
+    {file = "pyarrow-17.0.0-cp39-cp39-manylinux_2_28_x86_64.whl", hash = "sha256:a48ddf5c3c6a6c505904545c25a4ae13646ae1f8ba703c4df4a1bfe4f4006bda"},
+    {file = "pyarrow-17.0.0-cp39-cp39-win_amd64.whl", hash = "sha256:42bf93249a083aca230ba7e2786c5f673507fa97bbd9725a1e2754715151a204"},
+    {file = "pyarrow-17.0.0.tar.gz", hash = "sha256:4beca9521ed2c0921c1023e68d097d0299b62c362639ea315572a58f3f50fd28"},
 ]
 
 [package.dependencies]
@@ -10866,4 +10919,4 @@ cffi = ["cffi (>=1.11)"]
 [metadata]
 lock-version = "2.0"
 python-versions = ">=3.10,<3.13"
-content-hash = "1b268122d3d4771ba219f0e983322e0454b7b8644dba35da38d7d950d489e1ba"
+content-hash = "52552faf5f4823056eb48afe05349ab2f0e9a5bc42105211ccbbb54b59e27b59"
diff --git a/api/pyproject.toml b/api/pyproject.toml
index a549601535..a3313f0ff5 100644
--- a/api/pyproject.toml
+++ b/api/pyproject.toml
@@ -239,6 +239,7 @@ alibabacloud_gpdb20160503 = "~3.8.0"
 alibabacloud_tea_openapi = "~0.3.9"
 chromadb = "0.5.1"
 clickhouse-connect = "~0.7.16"
+couchbase = "~4.3.0"
 elasticsearch = "8.14.0"
 opensearch-py = "2.4.0"
 oracledb = "~2.2.1"
diff --git a/api/tests/integration_tests/vdb/couchbase/__init__.py b/api/tests/integration_tests/vdb/couchbase/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/tests/integration_tests/vdb/couchbase/test_couchbase.py b/api/tests/integration_tests/vdb/couchbase/test_couchbase.py
new file mode 100644
index 0000000000..d76c34ba0e
--- /dev/null
+++ b/api/tests/integration_tests/vdb/couchbase/test_couchbase.py
@@ -0,0 +1,50 @@
+import subprocess
+import time
+
+from core.rag.datasource.vdb.couchbase.couchbase_vector import CouchbaseConfig, CouchbaseVector
+from tests.integration_tests.vdb.test_vector_store import (
+    AbstractVectorTest,
+    get_example_text,
+    setup_mock_redis,
+)
+
+
+def wait_for_healthy_container(service_name="couchbase-server", timeout=300):
+    """Poll ``docker inspect`` every 10 s until the container is healthy; raise TimeoutError otherwise."""
+    inspect_cmd = ["docker", "inspect", "--format", "{{.State.Health.Status}}", service_name]
+    started = time.time()
+    while time.time() - started < timeout:
+        # Ask Docker for the container's health-check status.
+        status = subprocess.run(inspect_cmd, capture_output=True, text=True).stdout.strip()
+        if status == "healthy":
+            print(f"{service_name} is healthy!")
+            return True
+        print(f"Waiting for {service_name} to be healthy...")
+        time.sleep(10)
+    raise TimeoutError(f"{service_name} did not become healthy in time")
+
+
+class CouchbaseTest(AbstractVectorTest):
+    """Vector-store test case bound to a Couchbase instance at 127.0.0.1."""
+
+    def __init__(self):
+        super().__init__()
+        local_config = CouchbaseConfig(
+            connection_string="couchbase://127.0.0.1",
+            user="Administrator",
+            password="password",
+            bucket_name="Embeddings",
+            scope_name="_default",
+        )
+        self.vector = CouchbaseVector(collection_name=self.collection_name, config=local_config)
+
+    def search_by_vector(self):
+        # brief sleep to ensure document is indexed
+        time.sleep(5)
+        hits = self.vector.search_by_vector(query_vector=self.example_embedding)
+        assert len(hits) == 1
+
+
+def test_couchbase(setup_mock_redis):
+    wait_for_healthy_container("couchbase-server", timeout=60)  # raises TimeoutError if not healthy within 60 s
+    CouchbaseTest().run_all_tests()
diff --git a/dev/pytest/pytest_vdb.sh b/dev/pytest/pytest_vdb.sh
index 579da6a30e..418a129693 100755
--- a/dev/pytest/pytest_vdb.sh
+++ b/dev/pytest/pytest_vdb.sh
@@ -11,4 +11,5 @@ pytest api/tests/integration_tests/vdb/chroma \
   api/tests/integration_tests/vdb/vikingdb \
   api/tests/integration_tests/vdb/baidu \
   api/tests/integration_tests/vdb/tcvectordb \
-  api/tests/integration_tests/vdb/upstash
\ No newline at end of file
+  api/tests/integration_tests/vdb/upstash \
+  api/tests/integration_tests/vdb/couchbase \
diff --git a/docker/.env.example b/docker/.env.example
index 49ce48a20d..c506a9d92e 100644
--- a/docker/.env.example
+++ b/docker/.env.example
@@ -375,7 +375,7 @@ SUPABASE_URL=your-server-url
 # ------------------------------
 
 # The type of vector store to use.
-# Supported values are `weaviate`, `qdrant`, `milvus`, `myscale`, `relyt`, `pgvector`, `pgvecto-rs`, `chroma`, `opensearch`, `tidb_vector`, `oracle`, `tencent`, `elasticsearch`, `analyticdb`, `vikingdb`.
+# Supported values are `weaviate`, `qdrant`, `milvus`, `myscale`, `relyt`, `pgvector`, `pgvecto-rs`, `chroma`, `opensearch`, `tidb_vector`, `oracle`, `tencent`, `elasticsearch`, `analyticdb`, `couchbase`, `vikingdb`.
 VECTOR_STORE=weaviate
 
 # The Weaviate endpoint URL. Only available when VECTOR_STORE is `weaviate`.
@@ -414,6 +414,14 @@ MYSCALE_PASSWORD=
 MYSCALE_DATABASE=dify
 MYSCALE_FTS_PARAMS=
 
+# Couchbase configurations, only available when VECTOR_STORE is `couchbase`
+# The connection string must include hostname defined in the docker-compose file (couchbase-server in this case)
+COUCHBASE_CONNECTION_STRING=couchbase://couchbase-server
+COUCHBASE_USER=Administrator
+COUCHBASE_PASSWORD=password
+COUCHBASE_BUCKET_NAME=Embeddings
+COUCHBASE_SCOPE_NAME=_default
+
 # pgvector configurations, only available when VECTOR_STORE is `pgvector`
 PGVECTOR_HOST=pgvector
 PGVECTOR_PORT=5432
diff --git a/docker/couchbase-server/Dockerfile b/docker/couchbase-server/Dockerfile
new file mode 100644
index 0000000000..bd8af64150
--- /dev/null
+++ b/docker/couchbase-server/Dockerfile
@@ -0,0 +1,4 @@
+FROM couchbase/server:latest AS stage_base
+# Alternative base image (disabled): FROM couchbase:latest AS stage_base
+COPY init-cbserver.sh /opt/couchbase/init/
+RUN chmod +x /opt/couchbase/init/init-cbserver.sh
\ No newline at end of file
diff --git a/docker/couchbase-server/init-cbserver.sh b/docker/couchbase-server/init-cbserver.sh
new file mode 100755
index 0000000000..e66bc18530
--- /dev/null
+++ b/docker/couchbase-server/init-cbserver.sh
@@ -0,0 +1,44 @@
+#!/bin/bash
+# Starts Couchbase Server. Docker Compose runs only one command per container, so this script launches the server the same way the standard Couchbase Dockerfile does:
+# https://github.com/couchbase/docker/blob/master/enterprise/couchbase-server/7.2.0/Dockerfile#L88
+
+/entrypoint.sh couchbase-server & 
+
+# track whether setup is complete so we don't try to set up the cluster again
+FILE=/opt/couchbase/init/setupComplete.txt
+
+if ! [ -f "$FILE" ]; then
+  # used to automatically create the cluster based on environment variables
+  # https://docs.couchbase.com/server/current/cli/cbcli/couchbase-cli-cluster-init.html
+
+  echo $COUCHBASE_ADMINISTRATOR_USERNAME ":"  $COUCHBASE_ADMINISTRATOR_PASSWORD
+
+  sleep 20s
+  /opt/couchbase/bin/couchbase-cli cluster-init -c 127.0.0.1 \
+  --cluster-username $COUCHBASE_ADMINISTRATOR_USERNAME \
+  --cluster-password $COUCHBASE_ADMINISTRATOR_PASSWORD \
+  --services data,index,query,fts \
+  --cluster-ramsize $COUCHBASE_RAM_SIZE \
+  --cluster-index-ramsize $COUCHBASE_INDEX_RAM_SIZE \
+  --cluster-eventing-ramsize $COUCHBASE_EVENTING_RAM_SIZE \
+  --cluster-fts-ramsize $COUCHBASE_FTS_RAM_SIZE \
+  --index-storage-setting default
+
+  sleep 2s
+
+  # used to auto create the bucket based on environment variables
+  # https://docs.couchbase.com/server/current/cli/cbcli/couchbase-cli-bucket-create.html
+
+  /opt/couchbase/bin/couchbase-cli bucket-create -c localhost:8091 \
+  --username $COUCHBASE_ADMINISTRATOR_USERNAME \
+  --password $COUCHBASE_ADMINISTRATOR_PASSWORD \
+  --bucket $COUCHBASE_BUCKET \
+  --bucket-ramsize $COUCHBASE_BUCKET_RAMSIZE \
+  --bucket-type couchbase
+
+  # create a marker file so we know the cluster is set up and don't run the setup again
+  touch $FILE
+fi 
+  # couchbase-server was started in the background above, so this script must keep a
+  # foreground process alive; otherwise docker compose stops the container when it returns
+  tail -f /dev/null
diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index bf8a8b07e6..2a756ead9c 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -110,6 +110,11 @@ x-shared-env: &shared-api-worker-env
   QDRANT_CLIENT_TIMEOUT: ${QDRANT_CLIENT_TIMEOUT:-20}
   QDRANT_GRPC_ENABLED: ${QDRANT_GRPC_ENABLED:-false}
   QDRANT_GRPC_PORT: ${QDRANT_GRPC_PORT:-6334}
+  COUCHBASE_CONNECTION_STRING: ${COUCHBASE_CONNECTION_STRING:-'couchbase-server'}
+  COUCHBASE_USER: ${COUCHBASE_USER:-Administrator}
+  COUCHBASE_PASSWORD: ${COUCHBASE_PASSWORD:-password}
+  COUCHBASE_BUCKET_NAME: ${COUCHBASE_BUCKET_NAME:-Embeddings}
+  COUCHBASE_SCOPE_NAME: ${COUCHBASE_SCOPE_NAME:-_default}
   MILVUS_URI: ${MILVUS_URI:-http://127.0.0.1:19530}
   MILVUS_TOKEN: ${MILVUS_TOKEN:-}
   MILVUS_USER: ${MILVUS_USER:-root}
@@ -475,6 +480,39 @@ services:
     environment:
       QDRANT_API_KEY: ${QDRANT_API_KEY:-difyai123456}
 
+  # The Couchbase vector store.
+  couchbase-server:
+    build: ./couchbase-server
+    profiles:
+      - couchbase
+    restart: always
+    environment:
+      - CLUSTER_NAME=dify_search
+      - COUCHBASE_ADMINISTRATOR_USERNAME=${COUCHBASE_USER:-Administrator}
+      - COUCHBASE_ADMINISTRATOR_PASSWORD=${COUCHBASE_PASSWORD:-password}
+      - COUCHBASE_BUCKET=${COUCHBASE_BUCKET_NAME:-Embeddings}
+      - COUCHBASE_BUCKET_RAMSIZE=512
+      - COUCHBASE_RAM_SIZE=2048
+      - COUCHBASE_EVENTING_RAM_SIZE=512
+      - COUCHBASE_INDEX_RAM_SIZE=512
+      - COUCHBASE_FTS_RAM_SIZE=1024
+    hostname: couchbase-server
+    container_name: couchbase-server
+    working_dir: /opt/couchbase
+    stdin_open: true
+    tty: true
+    entrypoint: [""]
+    command: sh -c "/opt/couchbase/init/init-cbserver.sh"
+    volumes:
+      - ./volumes/couchbase/data:/opt/couchbase/var/lib/couchbase/data
+    healthcheck:
+      # ensure bucket was created before proceeding
+      test: [ "CMD-SHELL", "curl -s -f -u Administrator:password http://localhost:8091/pools/default/buckets | grep -q '\\[{' || exit 1" ]
+      interval: 10s
+      retries: 10
+      start_period: 30s
+      timeout: 10s
+
   # The pgvector vector database.
   pgvector:
     image: pgvector/pgvector:pg16

From 12adcf8925b5f0fee37c6443a54f4a24fc2551e5 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=9D=9E=E6=B3=95=E6=93=8D=E4=BD=9C?= <hjlarry@163.com>
Date: Tue, 29 Oct 2024 16:09:29 +0800
Subject: [PATCH 17/29] fix: gemini model use some tools raise error (#9993)

---
 .../model_providers/google/llm/llm.py         | 45 +++++++++++--------
 1 file changed, 26 insertions(+), 19 deletions(-)

diff --git a/api/core/model_runtime/model_providers/google/llm/llm.py b/api/core/model_runtime/model_providers/google/llm/llm.py
index e686ad08d9..b1b07a611b 100644
--- a/api/core/model_runtime/model_providers/google/llm/llm.py
+++ b/api/core/model_runtime/model_providers/google/llm/llm.py
@@ -116,26 +116,33 @@ class GoogleLargeLanguageModel(LargeLanguageModel):
         :param tools: tool messages
         :return: glm tools
         """
-        return glm.Tool(
-            function_declarations=[
-                glm.FunctionDeclaration(
-                    name=tool.name,
-                    parameters=glm.Schema(
-                        type=glm.Type.OBJECT,
-                        properties={
-                            key: {
-                                "type_": value.get("type", "string").upper(),
-                                "description": value.get("description", ""),
-                                "enum": value.get("enum", []),
-                            }
-                            for key, value in tool.parameters.get("properties", {}).items()
-                        },
-                        required=tool.parameters.get("required", []),
-                    ),
+        function_declarations = []
+        for tool in tools:
+            properties = {}
+            for key, value in tool.parameters.get("properties", {}).items():
+                properties[key] = {
+                    "type_": glm.Type.STRING,
+                    "description": value.get("description", ""),
+                    "enum": value.get("enum", []),
+                }
+
+            if properties:
+                parameters = glm.Schema(
+                    type=glm.Type.OBJECT,
+                    properties=properties,
+                    required=tool.parameters.get("required", []),
                 )
-                for tool in tools
-            ]
-        )
+            else:
+                parameters = None
+
+            function_declaration = glm.FunctionDeclaration(
+                name=tool.name,
+                parameters=parameters,
+                description=tool.description,
+            )
+            function_declarations.append(function_declaration)
+
+        return glm.Tool(function_declarations=function_declarations)
 
     def validate_credentials(self, model: str, credentials: dict) -> None:
         """

From 5580bcf8704fb0056979a611118c35de5f7d1b1d Mon Sep 17 00:00:00 2001
From: Jyong <76649700+JohnJyong@users.noreply.github.com>
Date: Tue, 29 Oct 2024 17:51:13 +0800
Subject: [PATCH 18/29] add tidb spend limit config (#9999)

---
 api/configs/middleware/vdb/tidb_on_qdrant_config.py        | 5 +++++
 api/core/rag/datasource/vdb/tidb_on_qdrant/tidb_service.py | 3 ++-
 2 files changed, 7 insertions(+), 1 deletion(-)

diff --git a/api/configs/middleware/vdb/tidb_on_qdrant_config.py b/api/configs/middleware/vdb/tidb_on_qdrant_config.py
index 98268798ef..d2625af264 100644
--- a/api/configs/middleware/vdb/tidb_on_qdrant_config.py
+++ b/api/configs/middleware/vdb/tidb_on_qdrant_config.py
@@ -63,3 +63,8 @@ class TidbOnQdrantConfig(BaseSettings):
         description="Tidb project id",
         default=None,
     )
+
+    TIDB_SPEND_LIMIT: Optional[int] = Field(
+        description="Tidb spend limit",
+        default=100,
+    )
diff --git a/api/core/rag/datasource/vdb/tidb_on_qdrant/tidb_service.py b/api/core/rag/datasource/vdb/tidb_on_qdrant/tidb_service.py
index f10d6339ee..0cd2a46460 100644
--- a/api/core/rag/datasource/vdb/tidb_on_qdrant/tidb_service.py
+++ b/api/core/rag/datasource/vdb/tidb_on_qdrant/tidb_service.py
@@ -4,6 +4,7 @@ import uuid
 import requests
 from requests.auth import HTTPDigestAuth
 
+from configs import dify_config
 from extensions.ext_database import db
 from extensions.ext_redis import redis_client
 from models.dataset import TidbAuthBinding
@@ -208,7 +209,7 @@ class TidbService:
             }
 
             spending_limit = {
-                "monthly": 10,
+                "monthly": dify_config.TIDB_SPEND_LIMIT,
             }
             password = str(uuid.uuid4()).replace("-", "")[:16]
             display_name = str(uuid.uuid4()).replace("-", "")

From 878d13ef4215e07ee8da346254e00843a707a361 Mon Sep 17 00:00:00 2001
From: powerfool <yuyi.wsy@oceanbase.com>
Date: Tue, 29 Oct 2024 21:10:18 +0800
Subject: [PATCH 19/29] Added OceanBase as an option for the vector store in
 Dify (#10010)

---
 .gitignore                                    |   1 +
 api/.env.example                              |   8 +
 api/commands.py                               |   1 +
 api/configs/middleware/__init__.py            |   2 +
 .../middleware/vdb/oceanbase_config.py        |  35 +++
 api/controllers/console/datasets/datasets.py  |   2 +
 .../rag/datasource/vdb/oceanbase/__init__.py  |   0
 .../vdb/oceanbase/oceanbase_vector.py         | 209 ++++++++++++++++++
 api/core/rag/datasource/vdb/vector_factory.py |   4 +
 api/core/rag/datasource/vdb/vector_type.py    |   1 +
 api/poetry.lock                               |  67 +++++-
 api/pyproject.toml                            |   1 +
 .../vdb/oceanbase/__init__.py                 |   0
 .../vdb/oceanbase/test_oceanbase.py           |  71 ++++++
 dev/pytest/pytest_vdb.sh                      |   1 +
 docker/.env.example                           |   8 +
 docker/docker-compose.yaml                    |  18 ++
 17 files changed, 427 insertions(+), 2 deletions(-)
 create mode 100644 api/configs/middleware/vdb/oceanbase_config.py
 create mode 100644 api/core/rag/datasource/vdb/oceanbase/__init__.py
 create mode 100644 api/core/rag/datasource/vdb/oceanbase/oceanbase_vector.py
 create mode 100644 api/tests/integration_tests/vdb/oceanbase/__init__.py
 create mode 100644 api/tests/integration_tests/vdb/oceanbase/test_oceanbase.py

diff --git a/.gitignore b/.gitignore
index 29a80534f7..60b5781733 100644
--- a/.gitignore
+++ b/.gitignore
@@ -174,6 +174,7 @@ docker/volumes/unstructured/*
 docker/volumes/pgvector/data/*
 docker/volumes/pgvecto_rs/data/*
 docker/volumes/couchbase/*
+docker/volumes/oceanbase/*
 
 docker/nginx/conf.d/default.conf
 docker/nginx/ssl/*
diff --git a/api/.env.example b/api/.env.example
index 2ce425338e..984985803e 100644
--- a/api/.env.example
+++ b/api/.env.example
@@ -249,6 +249,14 @@ VIKINGDB_SCHEMA=http
 VIKINGDB_CONNECTION_TIMEOUT=30
 VIKINGDB_SOCKET_TIMEOUT=30
 
+# OceanBase Vector configuration
+OCEANBASE_VECTOR_HOST=127.0.0.1
+OCEANBASE_VECTOR_PORT=2881
+OCEANBASE_VECTOR_USER=root@test
+OCEANBASE_VECTOR_PASSWORD=
+OCEANBASE_VECTOR_DATABASE=test
+OCEANBASE_MEMORY_LIMIT=6G
+
 # Upload configuration
 UPLOAD_FILE_SIZE_LIMIT=15
 UPLOAD_FILE_BATCH_LIMIT=5
diff --git a/api/commands.py b/api/commands.py
index da09f1b610..10122ceb3d 100644
--- a/api/commands.py
+++ b/api/commands.py
@@ -279,6 +279,7 @@ def migrate_knowledge_vector_database():
         VectorType.VIKINGDB,
         VectorType.UPSTASH,
         VectorType.COUCHBASE,
+        VectorType.OCEANBASE,
     }
     page = 1
     while True:
diff --git a/api/configs/middleware/__init__.py b/api/configs/middleware/__init__.py
index e8f6ba91b6..38bb804613 100644
--- a/api/configs/middleware/__init__.py
+++ b/api/configs/middleware/__init__.py
@@ -21,6 +21,7 @@ from configs.middleware.vdb.couchbase_config import CouchbaseConfig
 from configs.middleware.vdb.elasticsearch_config import ElasticsearchConfig
 from configs.middleware.vdb.milvus_config import MilvusConfig
 from configs.middleware.vdb.myscale_config import MyScaleConfig
+from configs.middleware.vdb.oceanbase_config import OceanBaseVectorConfig
 from configs.middleware.vdb.opensearch_config import OpenSearchConfig
 from configs.middleware.vdb.oracle_config import OracleConfig
 from configs.middleware.vdb.pgvector_config import PGVectorConfig
@@ -257,5 +258,6 @@ class MiddlewareConfig(
     VikingDBConfig,
     UpstashConfig,
     TidbOnQdrantConfig,
+    OceanBaseVectorConfig,
 ):
     pass
diff --git a/api/configs/middleware/vdb/oceanbase_config.py b/api/configs/middleware/vdb/oceanbase_config.py
new file mode 100644
index 0000000000..87427af960
--- /dev/null
+++ b/api/configs/middleware/vdb/oceanbase_config.py
@@ -0,0 +1,35 @@
+from typing import Optional
+
+from pydantic import Field, PositiveInt
+from pydantic_settings import BaseSettings
+
+
+class OceanBaseVectorConfig(BaseSettings):
+    """
+    Configuration settings for OceanBase Vector database
+    """
+
+    OCEANBASE_VECTOR_HOST: Optional[str] = Field(
+        description="Hostname or IP address of the OceanBase Vector server (e.g. 'localhost')",
+        default=None,
+    )
+
+    OCEANBASE_VECTOR_PORT: Optional[PositiveInt] = Field(
+        description="Port number on which the OceanBase Vector server is listening (default is 2881)",
+        default=2881,
+    )
+
+    OCEANBASE_VECTOR_USER: Optional[str] = Field(
+        description="Username for authenticating with the OceanBase Vector database",
+        default=None,
+    )
+
+    OCEANBASE_VECTOR_PASSWORD: Optional[str] = Field(
+        description="Password for authenticating with the OceanBase Vector database",
+        default=None,
+    )
+
+    OCEANBASE_VECTOR_DATABASE: Optional[str] = Field(
+        description="Name of the OceanBase Vector database to connect to",
+        default=None,
+    )
diff --git a/api/controllers/console/datasets/datasets.py b/api/controllers/console/datasets/datasets.py
index 854821746a..4f4d186edd 100644
--- a/api/controllers/console/datasets/datasets.py
+++ b/api/controllers/console/datasets/datasets.py
@@ -628,6 +628,7 @@ class DatasetRetrievalSettingApi(Resource):
                 | VectorType.BAIDU
                 | VectorType.VIKINGDB
                 | VectorType.UPSTASH
+                | VectorType.OCEANBASE
             ):
                 return {"retrieval_method": [RetrievalMethod.SEMANTIC_SEARCH.value]}
             case (
@@ -669,6 +670,7 @@ class DatasetRetrievalSettingMockApi(Resource):
                 | VectorType.BAIDU
                 | VectorType.VIKINGDB
                 | VectorType.UPSTASH
+                | VectorType.OCEANBASE
             ):
                 return {"retrieval_method": [RetrievalMethod.SEMANTIC_SEARCH.value]}
             case (
diff --git a/api/core/rag/datasource/vdb/oceanbase/__init__.py b/api/core/rag/datasource/vdb/oceanbase/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/core/rag/datasource/vdb/oceanbase/oceanbase_vector.py b/api/core/rag/datasource/vdb/oceanbase/oceanbase_vector.py
new file mode 100644
index 0000000000..8dd26a073b
--- /dev/null
+++ b/api/core/rag/datasource/vdb/oceanbase/oceanbase_vector.py
@@ -0,0 +1,209 @@
+import json
+import logging
+import math
+from typing import Any
+
+from pydantic import BaseModel, model_validator
+from pyobvector import VECTOR, ObVecClient
+from sqlalchemy import JSON, Column, String, func
+from sqlalchemy.dialects.mysql import LONGTEXT
+
+from configs import dify_config
+from core.rag.datasource.vdb.vector_base import BaseVector
+from core.rag.datasource.vdb.vector_factory import AbstractVectorFactory
+from core.rag.datasource.vdb.vector_type import VectorType
+from core.rag.embedding.embedding_base import Embeddings
+from core.rag.models.document import Document
+from extensions.ext_redis import redis_client
+from models.dataset import Dataset
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_OCEANBASE_HNSW_BUILD_PARAM = {"M": 16, "efConstruction": 256}
+DEFAULT_OCEANBASE_HNSW_SEARCH_PARAM = {"efSearch": 64}
+OCEANBASE_SUPPORTED_VECTOR_INDEX_TYPE = "HNSW"
+DEFAULT_OCEANBASE_VECTOR_METRIC_TYPE = "l2"
+
+
+class OceanBaseVectorConfig(BaseModel):
+    host: str
+    port: int
+    user: str
+    password: str
+    database: str
+
+    @model_validator(mode="before")
+    @classmethod
+    def validate_config(cls, values: dict) -> dict:
+        if not values["host"]:
+            raise ValueError("config OCEANBASE_VECTOR_HOST is required")
+        if not values["port"]:
+            raise ValueError("config OCEANBASE_VECTOR_PORT is required")
+        if not values["user"]:
+            raise ValueError("config OCEANBASE_VECTOR_USER is required")
+        if not values["database"]:
+            raise ValueError("config OCEANBASE_VECTOR_DATABASE is required")
+        return values
+
+
+class OceanBaseVector(BaseVector):
+    def __init__(self, collection_name: str, config: OceanBaseVectorConfig):
+        super().__init__(collection_name)
+        self._config = config
+        self._hnsw_ef_search = -1
+        self._client = ObVecClient(
+            uri=f"{self._config.host}:{self._config.port}",
+            user=self._config.user,
+            password=self._config.password,
+            db_name=self._config.database,
+        )
+
+    def get_type(self) -> str:
+        return VectorType.OCEANBASE
+
+    def create(self, texts: list[Document], embeddings: list[list[float]], **kwargs):
+        self._vec_dim = len(embeddings[0])
+        self._create_collection()
+        self.add_texts(texts, embeddings)
+
+    def _create_collection(self) -> None:
+        lock_name = "vector_indexing_lock_" + self._collection_name
+        with redis_client.lock(lock_name, timeout=20):
+            collection_exist_cache_key = "vector_indexing_" + self._collection_name
+            if redis_client.get(collection_exist_cache_key):
+                return
+
+            if self._client.check_table_exists(self._collection_name):
+                return
+
+            self.delete()
+
+            cols = [
+                Column("id", String(36), primary_key=True, autoincrement=False),
+                Column("vector", VECTOR(self._vec_dim)),
+                Column("text", LONGTEXT),
+                Column("metadata", JSON),
+            ]
+            vidx_params = self._client.prepare_index_params()
+            vidx_params.add_index(
+                field_name="vector",
+                index_type=OCEANBASE_SUPPORTED_VECTOR_INDEX_TYPE,
+                index_name="vector_index",
+                metric_type=DEFAULT_OCEANBASE_VECTOR_METRIC_TYPE,
+                params=DEFAULT_OCEANBASE_HNSW_BUILD_PARAM,
+            )
+
+            self._client.create_table_with_index_params(
+                table_name=self._collection_name,
+                columns=cols,
+                vidxs=vidx_params,
+            )
+            vals = []
+            params = self._client.perform_raw_text_sql("SHOW PARAMETERS LIKE '%ob_vector_memory_limit_percentage%'")
+            for row in params:
+                val = int(row[6])
+                vals.append(val)
+            if len(vals) == 0:
+                print("ob_vector_memory_limit_percentage not found in parameters.")
+                exit(1)
+            if any(val == 0 for val in vals):
+                try:
+                    self._client.perform_raw_text_sql("ALTER SYSTEM SET ob_vector_memory_limit_percentage = 30")
+                except Exception as e:
+                    raise Exception(
+                        "Failed to set ob_vector_memory_limit_percentage. "
+                        + "Maybe the database user has insufficient privilege.",
+                        e,
+                    )
+            redis_client.set(collection_exist_cache_key, 1, ex=3600)
+
+    def add_texts(self, documents: list[Document], embeddings: list[list[float]], **kwargs):
+        ids = self._get_uuids(documents)
+        for id, doc, emb in zip(ids, documents, embeddings):
+            self._client.insert(
+                table_name=self._collection_name,
+                data={
+                    "id": id,
+                    "vector": emb,
+                    "text": doc.page_content,
+                    "metadata": doc.metadata,
+                },
+            )
+
+    def text_exists(self, id: str) -> bool:
+        cur = self._client.get(table_name=self._collection_name, id=id)
+        return cur.rowcount != 0
+
+    def delete_by_ids(self, ids: list[str]) -> None:
+        self._client.delete(table_name=self._collection_name, ids=ids)
+
+    def get_ids_by_metadata_field(self, key: str, value: str) -> list[str]:
+        cur = self._client.get(
+            table_name=self._collection_name,
+            where_clause=f"metadata->>'$.{key}' = '{value}'",
+            output_column_name=["id"],
+        )
+        return [row[0] for row in cur]
+
+    def delete_by_metadata_field(self, key: str, value: str) -> None:
+        ids = self.get_ids_by_metadata_field(key, value)
+        self.delete_by_ids(ids)
+
+    def search_by_full_text(self, query: str, **kwargs: Any) -> list[Document]:
+        return []
+
+    def search_by_vector(self, query_vector: list[float], **kwargs: Any) -> list[Document]:
+        ef_search = kwargs.get("ef_search", self._hnsw_ef_search)
+        if ef_search != self._hnsw_ef_search:
+            self._client.set_ob_hnsw_ef_search(ef_search)
+            self._hnsw_ef_search = ef_search
+        topk = kwargs.get("top_k", 10)
+        cur = self._client.ann_search(
+            table_name=self._collection_name,
+            vec_column_name="vector",
+            vec_data=query_vector,
+            topk=topk,
+            distance_func=func.l2_distance,
+            output_column_names=["text", "metadata"],
+            with_dist=True,
+        )
+        docs = []
+        for text, metadata, distance in cur:
+            metadata = json.loads(metadata)
+            metadata["score"] = 1 - distance / math.sqrt(2)
+            docs.append(
+                Document(
+                    page_content=text,
+                    metadata=metadata,
+                )
+            )
+        return docs
+
+    def delete(self) -> None:
+        self._client.drop_table_if_exist(self._collection_name)
+
+
+class OceanBaseVectorFactory(AbstractVectorFactory):
+    def init_vector(
+        self,
+        dataset: Dataset,
+        attributes: list,
+        embeddings: Embeddings,
+    ) -> BaseVector:
+        if dataset.index_struct_dict:
+            class_prefix: str = dataset.index_struct_dict["vector_store"]["class_prefix"]
+            collection_name = class_prefix.lower()
+        else:
+            dataset_id = dataset.id
+            collection_name = Dataset.gen_collection_name_by_id(dataset_id).lower()
+            dataset.index_struct = json.dumps(self.gen_index_struct_dict(VectorType.OCEANBASE, collection_name))
+        return OceanBaseVector(
+            collection_name,
+            OceanBaseVectorConfig(
+                host=dify_config.OCEANBASE_VECTOR_HOST,
+                port=dify_config.OCEANBASE_VECTOR_PORT,
+                user=dify_config.OCEANBASE_VECTOR_USER,
+                password=(dify_config.OCEANBASE_VECTOR_PASSWORD or ""),
+                database=dify_config.OCEANBASE_VECTOR_DATABASE,
+            ),
+        )
diff --git a/api/core/rag/datasource/vdb/vector_factory.py b/api/core/rag/datasource/vdb/vector_factory.py
index 87d19bf60b..c8cb007ae8 100644
--- a/api/core/rag/datasource/vdb/vector_factory.py
+++ b/api/core/rag/datasource/vdb/vector_factory.py
@@ -134,6 +134,10 @@ class Vector:
                 from core.rag.datasource.vdb.tidb_on_qdrant.tidb_on_qdrant_vector import TidbOnQdrantVectorFactory
 
                 return TidbOnQdrantVectorFactory
+            case VectorType.OCEANBASE:
+                from core.rag.datasource.vdb.oceanbase.oceanbase_vector import OceanBaseVectorFactory
+
+                return OceanBaseVectorFactory
             case _:
                 raise ValueError(f"Vector store {vector_type} is not supported.")
 
diff --git a/api/core/rag/datasource/vdb/vector_type.py b/api/core/rag/datasource/vdb/vector_type.py
index 7384c12ff7..e3b37ece88 100644
--- a/api/core/rag/datasource/vdb/vector_type.py
+++ b/api/core/rag/datasource/vdb/vector_type.py
@@ -21,3 +21,4 @@ class VectorType(str, Enum):
     VIKINGDB = "vikingdb"
     UPSTASH = "upstash"
     TIDB_ON_QDRANT = "tidb_on_qdrant"
+    OCEANBASE = "oceanbase"
diff --git a/api/poetry.lock b/api/poetry.lock
index e1e5a6410b..5b581b9965 100644
--- a/api/poetry.lock
+++ b/api/poetry.lock
@@ -1,4 +1,4 @@
-# This file is automatically @generated by Poetry 1.8.3 and should not be changed by hand.
+# This file is automatically @generated by Poetry 1.8.2 and should not be changed by hand.
 
 [[package]]
 name = "aiohappyeyeballs"
@@ -932,6 +932,10 @@ files = [
     {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:a37b8f0391212d29b3a91a799c8e4a2855e0576911cdfb2515487e30e322253d"},
     {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_1_ppc64le.whl", hash = "sha256:e84799f09591700a4154154cab9787452925578841a94321d5ee8fb9a9a328f0"},
     {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:f66b5337fa213f1da0d9000bc8dc0cb5b896b726eefd9c6046f699b169c41b9e"},
+    {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_2_aarch64.whl", hash = "sha256:5dab0844f2cf82be357a0eb11a9087f70c5430b2c241493fc122bb6f2bb0917c"},
+    {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_2_i686.whl", hash = "sha256:e4fe605b917c70283db7dfe5ada75e04561479075761a0b3866c081d035b01c1"},
+    {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_2_ppc64le.whl", hash = "sha256:1e9a65b5736232e7a7f91ff3d02277f11d339bf34099a56cdab6a8b3410a02b2"},
+    {file = "Brotli-1.1.0-cp310-cp310-musllinux_1_2_x86_64.whl", hash = "sha256:58d4b711689366d4a03ac7957ab8c28890415e267f9b6589969e74b6e42225ec"},
     {file = "Brotli-1.1.0-cp310-cp310-win32.whl", hash = "sha256:be36e3d172dc816333f33520154d708a2657ea63762ec16b62ece02ab5e4daf2"},
     {file = "Brotli-1.1.0-cp310-cp310-win_amd64.whl", hash = "sha256:0c6244521dda65ea562d5a69b9a26120769b7a9fb3db2fe9545935ed6735b128"},
     {file = "Brotli-1.1.0-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:a3daabb76a78f829cafc365531c972016e4aa8d5b4bf60660ad8ecee19df7ccc"},
@@ -944,8 +948,14 @@ files = [
     {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_1_i686.whl", hash = "sha256:19c116e796420b0cee3da1ccec3b764ed2952ccfcc298b55a10e5610ad7885f9"},
     {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_1_ppc64le.whl", hash = "sha256:510b5b1bfbe20e1a7b3baf5fed9e9451873559a976c1a78eebaa3b86c57b4265"},
     {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:a1fd8a29719ccce974d523580987b7f8229aeace506952fa9ce1d53a033873c8"},
+    {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:c247dd99d39e0338a604f8c2b3bc7061d5c2e9e2ac7ba9cc1be5a69cb6cd832f"},
+    {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:1b2c248cd517c222d89e74669a4adfa5577e06ab68771a529060cf5a156e9757"},
+    {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:2a24c50840d89ded6c9a8fdc7b6ed3692ed4e86f1c4a4a938e1e92def92933e0"},
+    {file = "Brotli-1.1.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:f31859074d57b4639318523d6ffdca586ace54271a73ad23ad021acd807eb14b"},
     {file = "Brotli-1.1.0-cp311-cp311-win32.whl", hash = "sha256:39da8adedf6942d76dc3e46653e52df937a3c4d6d18fdc94a7c29d263b1f5b50"},
     {file = "Brotli-1.1.0-cp311-cp311-win_amd64.whl", hash = "sha256:aac0411d20e345dc0920bdec5548e438e999ff68d77564d5e9463a7ca9d3e7b1"},
+    {file = "Brotli-1.1.0-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:32d95b80260d79926f5fab3c41701dbb818fde1c9da590e77e571eefd14abe28"},
+    {file = "Brotli-1.1.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:b760c65308ff1e462f65d69c12e4ae085cff3b332d894637f6273a12a482d09f"},
     {file = "Brotli-1.1.0-cp312-cp312-macosx_10_9_universal2.whl", hash = "sha256:316cc9b17edf613ac76b1f1f305d2a748f1b976b033b049a6ecdfd5612c70409"},
     {file = "Brotli-1.1.0-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:caf9ee9a5775f3111642d33b86237b05808dafcd6268faa492250e9b78046eb2"},
     {file = "Brotli-1.1.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:70051525001750221daa10907c77830bc889cb6d865cc0b813d9db7fefc21451"},
@@ -956,8 +966,24 @@ files = [
     {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_1_i686.whl", hash = "sha256:4093c631e96fdd49e0377a9c167bfd75b6d0bad2ace734c6eb20b348bc3ea180"},
     {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_1_ppc64le.whl", hash = "sha256:7e4c4629ddad63006efa0ef968c8e4751c5868ff0b1c5c40f76524e894c50248"},
     {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:861bf317735688269936f755fa136a99d1ed526883859f86e41a5d43c61d8966"},
+    {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:87a3044c3a35055527ac75e419dfa9f4f3667a1e887ee80360589eb8c90aabb9"},
+    {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:c5529b34c1c9d937168297f2c1fde7ebe9ebdd5e121297ff9c043bdb2ae3d6fb"},
+    {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:ca63e1890ede90b2e4454f9a65135a4d387a4585ff8282bb72964fab893f2111"},
+    {file = "Brotli-1.1.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:e79e6520141d792237c70bcd7a3b122d00f2613769ae0cb61c52e89fd3443839"},
     {file = "Brotli-1.1.0-cp312-cp312-win32.whl", hash = "sha256:5f4d5ea15c9382135076d2fb28dde923352fe02951e66935a9efaac8f10e81b0"},
     {file = "Brotli-1.1.0-cp312-cp312-win_amd64.whl", hash = "sha256:906bc3a79de8c4ae5b86d3d75a8b77e44404b0f4261714306e3ad248d8ab0951"},
+    {file = "Brotli-1.1.0-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:8bf32b98b75c13ec7cf774164172683d6e7891088f6316e54425fde1efc276d5"},
+    {file = "Brotli-1.1.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:7bc37c4d6b87fb1017ea28c9508b36bbcb0c3d18b4260fcdf08b200c74a6aee8"},
+    {file = "Brotli-1.1.0-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:3c0ef38c7a7014ffac184db9e04debe495d317cc9c6fb10071f7fefd93100a4f"},
+    {file = "Brotli-1.1.0-cp313-cp313-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:91d7cc2a76b5567591d12c01f019dd7afce6ba8cba6571187e21e2fc418ae648"},
+    {file = "Brotli-1.1.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a93dde851926f4f2678e704fadeb39e16c35d8baebd5252c9fd94ce8ce68c4a0"},
+    {file = "Brotli-1.1.0-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:f0db75f47be8b8abc8d9e31bc7aad0547ca26f24a54e6fd10231d623f183d089"},
+    {file = "Brotli-1.1.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:6967ced6730aed543b8673008b5a391c3b1076d834ca438bbd70635c73775368"},
+    {file = "Brotli-1.1.0-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:7eedaa5d036d9336c95915035fb57422054014ebdeb6f3b42eac809928e40d0c"},
+    {file = "Brotli-1.1.0-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:d487f5432bf35b60ed625d7e1b448e2dc855422e87469e3f450aa5552b0eb284"},
+    {file = "Brotli-1.1.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:832436e59afb93e1836081a20f324cb185836c617659b07b129141a8426973c7"},
+    {file = "Brotli-1.1.0-cp313-cp313-win32.whl", hash = "sha256:43395e90523f9c23a3d5bdf004733246fba087f2948f87ab28015f12359ca6a0"},
+    {file = "Brotli-1.1.0-cp313-cp313-win_amd64.whl", hash = "sha256:9011560a466d2eb3f5a6e4929cf4a09be405c64154e12df0dd72713f6500e32b"},
     {file = "Brotli-1.1.0-cp36-cp36m-macosx_10_9_x86_64.whl", hash = "sha256:a090ca607cbb6a34b0391776f0cb48062081f5f60ddcce5d11838e67a01928d1"},
     {file = "Brotli-1.1.0-cp36-cp36m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:2de9d02f5bda03d27ede52e8cfe7b865b066fa49258cbab568720aa5be80a47d"},
     {file = "Brotli-1.1.0-cp36-cp36m-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:2333e30a5e00fe0fe55903c8832e08ee9c3b1382aacf4db26664a16528d51b4b"},
@@ -967,6 +993,10 @@ files = [
     {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_1_i686.whl", hash = "sha256:fd5f17ff8f14003595ab414e45fce13d073e0762394f957182e69035c9f3d7c2"},
     {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_1_ppc64le.whl", hash = "sha256:069a121ac97412d1fe506da790b3e69f52254b9df4eb665cd42460c837193354"},
     {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_1_x86_64.whl", hash = "sha256:e93dfc1a1165e385cc8239fab7c036fb2cd8093728cbd85097b284d7b99249a2"},
+    {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_2_aarch64.whl", hash = "sha256:aea440a510e14e818e67bfc4027880e2fb500c2ccb20ab21c7a7c8b5b4703d75"},
+    {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_2_i686.whl", hash = "sha256:6974f52a02321b36847cd19d1b8e381bf39939c21efd6ee2fc13a28b0d99348c"},
+    {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_2_ppc64le.whl", hash = "sha256:a7e53012d2853a07a4a79c00643832161a910674a893d296c9f1259859a289d2"},
+    {file = "Brotli-1.1.0-cp36-cp36m-musllinux_1_2_x86_64.whl", hash = "sha256:d7702622a8b40c49bffb46e1e3ba2e81268d5c04a34f460978c6b5517a34dd52"},
     {file = "Brotli-1.1.0-cp36-cp36m-win32.whl", hash = "sha256:a599669fd7c47233438a56936988a2478685e74854088ef5293802123b5b2460"},
     {file = "Brotli-1.1.0-cp36-cp36m-win_amd64.whl", hash = "sha256:d143fd47fad1db3d7c27a1b1d66162e855b5d50a89666af46e1679c496e8e579"},
     {file = "Brotli-1.1.0-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:11d00ed0a83fa22d29bc6b64ef636c4552ebafcef57154b4ddd132f5638fbd1c"},
@@ -978,6 +1008,10 @@ files = [
     {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_1_i686.whl", hash = "sha256:919e32f147ae93a09fe064d77d5ebf4e35502a8df75c29fb05788528e330fe74"},
     {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_1_ppc64le.whl", hash = "sha256:23032ae55523cc7bccb4f6a0bf368cd25ad9bcdcc1990b64a647e7bbcce9cb5b"},
     {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:224e57f6eac61cc449f498cc5f0e1725ba2071a3d4f48d5d9dffba42db196438"},
+    {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_2_aarch64.whl", hash = "sha256:cb1dac1770878ade83f2ccdf7d25e494f05c9165f5246b46a621cc849341dc01"},
+    {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_2_i686.whl", hash = "sha256:3ee8a80d67a4334482d9712b8e83ca6b1d9bc7e351931252ebef5d8f7335a547"},
+    {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_2_ppc64le.whl", hash = "sha256:5e55da2c8724191e5b557f8e18943b1b4839b8efc3ef60d65985bcf6f587dd38"},
+    {file = "Brotli-1.1.0-cp37-cp37m-musllinux_1_2_x86_64.whl", hash = "sha256:d342778ef319e1026af243ed0a07c97acf3bad33b9f29e7ae6a1f68fd083e90c"},
     {file = "Brotli-1.1.0-cp37-cp37m-win32.whl", hash = "sha256:587ca6d3cef6e4e868102672d3bd9dc9698c309ba56d41c2b9c85bbb903cdb95"},
     {file = "Brotli-1.1.0-cp37-cp37m-win_amd64.whl", hash = "sha256:2954c1c23f81c2eaf0b0717d9380bd348578a94161a65b3a2afc62c86467dd68"},
     {file = "Brotli-1.1.0-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:efa8b278894b14d6da122a72fefcebc28445f2d3f880ac59d46c90f4c13be9a3"},
@@ -990,6 +1024,10 @@ files = [
     {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_1_i686.whl", hash = "sha256:1ab4fbee0b2d9098c74f3057b2bc055a8bd92ccf02f65944a241b4349229185a"},
     {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_1_ppc64le.whl", hash = "sha256:141bd4d93984070e097521ed07e2575b46f817d08f9fa42b16b9b5f27b5ac088"},
     {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:fce1473f3ccc4187f75b4690cfc922628aed4d3dd013d047f95a9b3919a86596"},
+    {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_2_aarch64.whl", hash = "sha256:d2b35ca2c7f81d173d2fadc2f4f31e88cc5f7a39ae5b6db5513cf3383b0e0ec7"},
+    {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_2_i686.whl", hash = "sha256:af6fa6817889314555aede9a919612b23739395ce767fe7fcbea9a80bf140fe5"},
+    {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_2_ppc64le.whl", hash = "sha256:2feb1d960f760a575dbc5ab3b1c00504b24caaf6986e2dc2b01c09c87866a943"},
+    {file = "Brotli-1.1.0-cp38-cp38-musllinux_1_2_x86_64.whl", hash = "sha256:4410f84b33374409552ac9b6903507cdb31cd30d2501fc5ca13d18f73548444a"},
     {file = "Brotli-1.1.0-cp38-cp38-win32.whl", hash = "sha256:db85ecf4e609a48f4b29055f1e144231b90edc90af7481aa731ba2d059226b1b"},
     {file = "Brotli-1.1.0-cp38-cp38-win_amd64.whl", hash = "sha256:3d7954194c36e304e1523f55d7042c59dc53ec20dd4e9ea9d151f1b62b4415c0"},
     {file = "Brotli-1.1.0-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:5fb2ce4b8045c78ebbc7b8f3c15062e435d47e7393cc57c25115cfd49883747a"},
@@ -1002,6 +1040,10 @@ files = [
     {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_1_i686.whl", hash = "sha256:949f3b7c29912693cee0afcf09acd6ebc04c57af949d9bf77d6101ebb61e388c"},
     {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_1_ppc64le.whl", hash = "sha256:89f4988c7203739d48c6f806f1e87a1d96e0806d44f0fba61dba81392c9e474d"},
     {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:de6551e370ef19f8de1807d0a9aa2cdfdce2e85ce88b122fe9f6b2b076837e59"},
+    {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_2_aarch64.whl", hash = "sha256:0737ddb3068957cf1b054899b0883830bb1fec522ec76b1098f9b6e0f02d9419"},
+    {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_2_i686.whl", hash = "sha256:4f3607b129417e111e30637af1b56f24f7a49e64763253bbc275c75fa887d4b2"},
+    {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_2_ppc64le.whl", hash = "sha256:6c6e0c425f22c1c719c42670d561ad682f7bfeeef918edea971a79ac5252437f"},
+    {file = "Brotli-1.1.0-cp39-cp39-musllinux_1_2_x86_64.whl", hash = "sha256:494994f807ba0b92092a163a0a283961369a65f6cbe01e8891132b7a320e61eb"},
     {file = "Brotli-1.1.0-cp39-cp39-win32.whl", hash = "sha256:f0d8a7a6b5983c2496e364b969f0e526647a06b075d034f3297dc66f3b360c64"},
     {file = "Brotli-1.1.0-cp39-cp39-win_amd64.whl", hash = "sha256:cdad5b9014d83ca68c25d2e9444e28e967ef16e80f6b436918c700c117a85467"},
     {file = "Brotli-1.1.0.tar.gz", hash = "sha256:81de08ac11bcb85841e440c13611c00b67d3bf82698314928d0b676362546724"},
@@ -7269,6 +7311,22 @@ files = [
 ed25519 = ["PyNaCl (>=1.4.0)"]
 rsa = ["cryptography"]
 
+[[package]]
+name = "pyobvector"
+version = "0.1.6"
+description = "A python SDK for OceanBase Vector Store, based on SQLAlchemy, compatible with Milvus API."
+optional = false
+python-versions = "<4.0,>=3.9"
+files = [
+    {file = "pyobvector-0.1.6-py3-none-any.whl", hash = "sha256:0d700e865a85b4716b9a03384189e49288cd9d5f3cef88aed4740bc82d5fd136"},
+    {file = "pyobvector-0.1.6.tar.gz", hash = "sha256:05551addcac8c596992d5e38b480c83ca3481c6cfc6f56a1a1bddfb2e6ae037e"},
+]
+
+[package.dependencies]
+numpy = ">=1.26.0,<2.0.0"
+pymysql = ">=1.1.1,<2.0.0"
+sqlalchemy = ">=2.0.32,<3.0.0"
+
 [[package]]
 name = "pyopenssl"
 version = "24.2.1"
@@ -8677,6 +8735,11 @@ files = [
     {file = "scikit_learn-1.5.2-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f60021ec1574e56632be2a36b946f8143bf4e5e6af4a06d85281adc22938e0dd"},
     {file = "scikit_learn-1.5.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:394397841449853c2290a32050382edaec3da89e35b3e03d6cc966aebc6a8ae6"},
     {file = "scikit_learn-1.5.2-cp312-cp312-win_amd64.whl", hash = "sha256:57cc1786cfd6bd118220a92ede80270132aa353647684efa385a74244a41e3b1"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:e9a702e2de732bbb20d3bad29ebd77fc05a6b427dc49964300340e4c9328b3f5"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:b0768ad641981f5d3a198430a1d31c3e044ed2e8a6f22166b4d546a5116d7908"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:178ddd0a5cb0044464fc1bfc4cca5b1833bfc7bb022d70b05db8530da4bb3dd3"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f7284ade780084d94505632241bf78c44ab3b6f1e8ccab3d2af58e0e950f9c12"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-win_amd64.whl", hash = "sha256:b7b0f9a0b1040830d38c39b91b3a44e1b643f4b36e36567b80b7c6bd2202a27f"},
     {file = "scikit_learn-1.5.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:757c7d514ddb00ae249832fe87100d9c73c6ea91423802872d9e74970a0e40b9"},
     {file = "scikit_learn-1.5.2-cp39-cp39-macosx_12_0_arm64.whl", hash = "sha256:52788f48b5d8bca5c0736c175fa6bdaab2ef00a8f536cda698db61bd89c551c1"},
     {file = "scikit_learn-1.5.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:643964678f4b5fbdc95cbf8aec638acc7aa70f5f79ee2cdad1eec3df4ba6ead8"},
@@ -10919,4 +10982,4 @@ cffi = ["cffi (>=1.11)"]
 [metadata]
 lock-version = "2.0"
 python-versions = ">=3.10,<3.13"
-content-hash = "52552faf5f4823056eb48afe05349ab2f0e9a5bc42105211ccbbb54b59e27b59"
+content-hash = "ef927b98c33d704d680e08db0e5c7d9a4e05454c66fcd6a5f656a65eb08e886b"
diff --git a/api/pyproject.toml b/api/pyproject.toml
index a3313f0ff5..ee7cf4d618 100644
--- a/api/pyproject.toml
+++ b/api/pyproject.toml
@@ -247,6 +247,7 @@ pgvecto-rs = { version = "~0.2.1", extras = ['sqlalchemy'] }
 pgvector = "0.2.5"
 pymilvus = "~2.4.4"
 pymochow = "1.3.1"
+pyobvector = "~0.1.6"
 qdrant-client = "1.7.3"
 tcvectordb = "1.3.2"
 tidb-vector = "0.0.9"
diff --git a/api/tests/integration_tests/vdb/oceanbase/__init__.py b/api/tests/integration_tests/vdb/oceanbase/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/tests/integration_tests/vdb/oceanbase/test_oceanbase.py b/api/tests/integration_tests/vdb/oceanbase/test_oceanbase.py
new file mode 100644
index 0000000000..ebcb134168
--- /dev/null
+++ b/api/tests/integration_tests/vdb/oceanbase/test_oceanbase.py
@@ -0,0 +1,71 @@
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from core.rag.datasource.vdb.oceanbase.oceanbase_vector import (
+    OceanBaseVector,
+    OceanBaseVectorConfig,
+)
+from tests.integration_tests.vdb.__mock.tcvectordb import setup_tcvectordb_mock
+from tests.integration_tests.vdb.test_vector_store import (
+    AbstractVectorTest,
+    get_example_text,
+    setup_mock_redis,
+)
+
+
+@pytest.fixture
+def oceanbase_vector():
+    return OceanBaseVector(
+        "dify_test_collection",
+        config=OceanBaseVectorConfig(
+            host="127.0.0.1",
+            port="2881",
+            user="root@test",
+            database="test",
+            password="test",
+        ),
+    )
+
+
+class OceanBaseVectorTest(AbstractVectorTest):
+    def __init__(self, vector: OceanBaseVector):
+        super().__init__()
+        self.vector = vector
+
+    def search_by_vector(self):
+        hits_by_vector = self.vector.search_by_vector(query_vector=self.example_embedding)
+        assert len(hits_by_vector) == 0
+
+    def search_by_full_text(self):
+        hits_by_full_text = self.vector.search_by_full_text(query=get_example_text())
+        assert len(hits_by_full_text) == 0
+
+    def text_exists(self):
+        exist = self.vector.text_exists(self.example_doc_id)
+        assert exist == True
+
+    def get_ids_by_metadata_field(self):
+        ids = self.vector.get_ids_by_metadata_field(key="document_id", value=self.example_doc_id)
+        assert len(ids) == 0
+
+
+@pytest.fixture
+def setup_mock_oceanbase_client():
+    with patch("core.rag.datasource.vdb.oceanbase.oceanbase_vector.ObVecClient", new_callable=MagicMock) as mock_client:
+        yield mock_client
+
+
+@pytest.fixture
+def setup_mock_oceanbase_vector(oceanbase_vector):
+    with patch.object(oceanbase_vector, "_client"):
+        yield oceanbase_vector
+
+
+def test_oceanbase_vector(
+    setup_mock_redis,
+    setup_mock_oceanbase_client,
+    setup_mock_oceanbase_vector,
+    oceanbase_vector,
+):
+    OceanBaseVectorTest(oceanbase_vector).run_all_tests()
diff --git a/dev/pytest/pytest_vdb.sh b/dev/pytest/pytest_vdb.sh
index 418a129693..02a9f49279 100755
--- a/dev/pytest/pytest_vdb.sh
+++ b/dev/pytest/pytest_vdb.sh
@@ -13,3 +13,4 @@ pytest api/tests/integration_tests/vdb/chroma \
   api/tests/integration_tests/vdb/tcvectordb \
   api/tests/integration_tests/vdb/upstash \
   api/tests/integration_tests/vdb/couchbase \
+  api/tests/integration_tests/vdb/oceanbase \
diff --git a/docker/.env.example b/docker/.env.example
index c506a9d92e..db99701c52 100644
--- a/docker/.env.example
+++ b/docker/.env.example
@@ -517,6 +517,14 @@ VIKINGDB_SCHEMA=http
 VIKINGDB_CONNECTION_TIMEOUT=30
 VIKINGDB_SOCKET_TIMEOUT=30
 
+# OceanBase Vector configuration, only available when VECTOR_STORE is `oceanbase`
+OCEANBASE_VECTOR_HOST=oceanbase-vector
+OCEANBASE_VECTOR_PORT=2881
+OCEANBASE_VECTOR_USER=root@test
+OCEANBASE_VECTOR_PASSWORD=
+OCEANBASE_VECTOR_DATABASE=test
+OCEANBASE_MEMORY_LIMIT=6G
+
 # ------------------------------
 # Knowledge Configuration
 # ------------------------------
diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index 2a756ead9c..28a70b0f56 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -243,6 +243,12 @@ x-shared-env: &shared-api-worker-env
   POSITION_PROVIDER_INCLUDES: ${POSITION_PROVIDER_INCLUDES:-}
   POSITION_PROVIDER_EXCLUDES: ${POSITION_PROVIDER_EXCLUDES:-}
   MAX_VARIABLE_SIZE: ${MAX_VARIABLE_SIZE:-204800}
+  OCEANBASE_VECTOR_HOST: ${OCEANBASE_VECTOR_HOST:-oceanbase-vector}
+  OCEANBASE_VECTOR_PORT: ${OCEANBASE_VECTOR_PORT:-2881}
+  OCEANBASE_VECTOR_USER: ${OCEANBASE_VECTOR_USER:-root@test}
+  OCEANBASE_VECTOR_PASSWORD: ${OCEANBASE_VECTOR_PASSWORD:-}
+  OCEANBASE_VECTOR_DATABASE: ${OCEANBASE_VECTOR_DATABASE:-test}
+  OCEANBASE_MEMORY_LIMIT: ${OCEANBASE_MEMORY_LIMIT:-6G}
 
 services:
   # API service
@@ -570,6 +576,18 @@ services:
       CHROMA_SERVER_AUTHN_PROVIDER: ${CHROMA_SERVER_AUTHN_PROVIDER:-chromadb.auth.token_authn.TokenAuthenticationServerProvider}
       IS_PERSISTENT: ${CHROMA_IS_PERSISTENT:-TRUE}
 
+  # OceanBase vector database
+  oceanbase-vector:
+    image: quay.io/oceanbase/oceanbase-ce:4.3.3.0-100000142024101215
+    profiles:
+      - oceanbase-vector
+    restart: always
+    volumes:
+      - ./volumes/oceanbase/data:/root/ob
+      - ./volumes/oceanbase/conf:/root/.obd/cluster
+    environment:
+      OB_MEMORY_LIMIT: ${OCEANBASE_MEMORY_LIMIT:-6G}
+
   # Oracle vector database
   oracle:
     image: container-registry.oracle.com/database/free:latest

From c6e54c83c87917334a4c95fdb5599d1597f32e4c Mon Sep 17 00:00:00 2001
From: zhuhao <37029601+hwzhuhao@users.noreply.github.com>
Date: Tue, 29 Oct 2024 21:11:10 +0800
Subject: [PATCH 20/29] chore: add tidb-on-qdrant configuration in env and
 docker-compose file (#10015)

---
 api/.env.example           | 14 ++++++++++++++
 docker/.env.example        | 14 ++++++++++++++
 docker/docker-compose.yaml | 12 ++++++++++++
 3 files changed, 40 insertions(+)

diff --git a/api/.env.example b/api/.env.example
index 984985803e..79d6ffdf6a 100644
--- a/api/.env.example
+++ b/api/.env.example
@@ -202,6 +202,20 @@ TIDB_VECTOR_USER=xxx.root
 TIDB_VECTOR_PASSWORD=xxxxxx
 TIDB_VECTOR_DATABASE=dify
 
+# Tidb on qdrant configuration
+TIDB_ON_QDRANT_URL=http://127.0.0.1
+TIDB_ON_QDRANT_API_KEY=dify
+TIDB_ON_QDRANT_CLIENT_TIMEOUT=20
+TIDB_ON_QDRANT_GRPC_ENABLED=false
+TIDB_ON_QDRANT_GRPC_PORT=6334
+TIDB_PUBLIC_KEY=dify
+TIDB_PRIVATE_KEY=dify
+TIDB_API_URL=http://127.0.0.1
+TIDB_IAM_API_URL=http://127.0.0.1
+TIDB_REGION=regions/aws-us-east-1
+TIDB_PROJECT_ID=dify
+TIDB_SPEND_LIMIT=100
+
 # Chroma configuration
 CHROMA_HOST=127.0.0.1
 CHROMA_PORT=8000
diff --git a/docker/.env.example b/docker/.env.example
index db99701c52..ef2f331c11 100644
--- a/docker/.env.example
+++ b/docker/.env.example
@@ -455,6 +455,20 @@ TIDB_VECTOR_USER=xxx.root
 TIDB_VECTOR_PASSWORD=xxxxxx
 TIDB_VECTOR_DATABASE=dify
 
+# Tidb on qdrant configuration, only available when VECTOR_STORE is `tidb_on_qdrant`
+TIDB_ON_QDRANT_URL=http://127.0.0.1
+TIDB_ON_QDRANT_API_KEY=dify
+TIDB_ON_QDRANT_CLIENT_TIMEOUT=20
+TIDB_ON_QDRANT_GRPC_ENABLED=false
+TIDB_ON_QDRANT_GRPC_PORT=6334
+TIDB_PUBLIC_KEY=dify
+TIDB_PRIVATE_KEY=dify
+TIDB_API_URL=http://127.0.0.1
+TIDB_IAM_API_URL=http://127.0.0.1
+TIDB_REGION=regions/aws-us-east-1
+TIDB_PROJECT_ID=dify
+TIDB_SPEND_LIMIT=100
+
 # Chroma configuration, only available when VECTOR_STORE is `chroma`
 CHROMA_HOST=127.0.0.1
 CHROMA_PORT=8000
diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index 28a70b0f56..47e4a0ddbb 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -140,6 +140,18 @@ x-shared-env: &shared-api-worker-env
   TIDB_VECTOR_USER: ${TIDB_VECTOR_USER:-}
   TIDB_VECTOR_PASSWORD: ${TIDB_VECTOR_PASSWORD:-}
   TIDB_VECTOR_DATABASE: ${TIDB_VECTOR_DATABASE:-dify}
+  TIDB_ON_QDRANT_URL: ${TIDB_ON_QDRANT_URL:-http://127.0.0.1}
+  TIDB_ON_QDRANT_API_KEY: ${TIDB_ON_QDRANT_API_KEY:-dify}
+  TIDB_ON_QDRANT_CLIENT_TIMEOUT: ${TIDB_ON_QDRANT_CLIENT_TIMEOUT:-20}
+  TIDB_ON_QDRANT_GRPC_ENABLED: ${TIDB_ON_QDRANT_GRPC_ENABLED:-false}
+  TIDB_ON_QDRANT_GRPC_PORT: ${TIDB_ON_QDRANT_GRPC_PORT:-6334}
+  TIDB_PUBLIC_KEY: ${TIDB_PUBLIC_KEY:-dify}
+  TIDB_PRIVATE_KEY: ${TIDB_PRIVATE_KEY:-dify}
+  TIDB_API_URL: ${TIDB_API_URL:-http://127.0.0.1}
+  TIDB_IAM_API_URL: ${TIDB_IAM_API_URL:-http://127.0.0.1}
+  TIDB_REGION: ${TIDB_REGION:-regions/aws-us-east-1}
+  TIDB_PROJECT_ID: ${TIDB_PROJECT_ID:-dify}
+  TIDB_SPEND_LIMIT: ${TIDB_SPEND_LIMIT:-100}
   ORACLE_HOST: ${ORACLE_HOST:-oracle}
   ORACLE_PORT: ${ORACLE_PORT:-1521}
   ORACLE_USER: ${ORACLE_USER:-dify}

From 539fc8b7608c8f3046a6fd1fa247e4e96a0053ff Mon Sep 17 00:00:00 2001
From: Hiroshi Fujita <fujita-h@users.noreply.github.com>
Date: Wed, 30 Oct 2024 03:11:18 +0900
Subject: [PATCH 21/29] Fix content-type header case sensitivity (#9961)

---
 .../workflow/nodes/http_request/entities.py   |  4 +--
 api/core/workflow/nodes/http_request/node.py  |  3 +-
 .../workflow/nodes/test_http.py               | 34 +++++++++++++++++++
 3 files changed, 38 insertions(+), 3 deletions(-)

diff --git a/api/core/workflow/nodes/http_request/entities.py b/api/core/workflow/nodes/http_request/entities.py
index dec76a277e..36ded104c1 100644
--- a/api/core/workflow/nodes/http_request/entities.py
+++ b/api/core/workflow/nodes/http_request/entities.py
@@ -94,7 +94,7 @@ class Response:
     @property
     def is_file(self):
         content_type = self.content_type
-        content_disposition = self.response.headers.get("Content-Disposition", "")
+        content_disposition = self.response.headers.get("content-disposition", "")
 
         return "attachment" in content_disposition or (
             not any(non_file in content_type for non_file in NON_FILE_CONTENT_TYPES)
@@ -103,7 +103,7 @@ class Response:
 
     @property
     def content_type(self) -> str:
-        return self.headers.get("Content-Type", "")
+        return self.headers.get("content-type", "")
 
     @property
     def text(self) -> str:
diff --git a/api/core/workflow/nodes/http_request/node.py b/api/core/workflow/nodes/http_request/node.py
index 483d0e2b7e..a037bee665 100644
--- a/api/core/workflow/nodes/http_request/node.py
+++ b/api/core/workflow/nodes/http_request/node.py
@@ -142,10 +142,11 @@ class HttpRequestNode(BaseNode[HttpRequestNodeData]):
         Extract files from response
         """
         files = []
+        is_file = response.is_file
         content_type = response.content_type
         content = response.content
 
-        if content_type:
+        if is_file and content_type:
             # extract filename from url
             filename = path.basename(url)
             # extract extension if possible
diff --git a/api/tests/integration_tests/workflow/nodes/test_http.py b/api/tests/integration_tests/workflow/nodes/test_http.py
index 9eea63f722..0da6622658 100644
--- a/api/tests/integration_tests/workflow/nodes/test_http.py
+++ b/api/tests/integration_tests/workflow/nodes/test_http.py
@@ -430,3 +430,37 @@ def test_multi_colons_parse(setup_http_mock):
     assert urlencode({"Redirect": "http://example2.com"}) in result.process_data.get("request", "")
     assert 'form-data; name="Redirect"\r\n\r\nhttp://example6.com' in result.process_data.get("request", "")
     # assert "http://example3.com" == resp.get("headers", {}).get("referer")
+
+
+def test_image_file(monkeypatch):
+    from types import SimpleNamespace
+
+    monkeypatch.setattr(
+        "core.tools.tool_file_manager.ToolFileManager.create_file_by_raw",
+        lambda *args, **kwargs: SimpleNamespace(id="1"),
+    )
+
+    node = init_http_node(
+        config={
+            "id": "1",
+            "data": {
+                "title": "http",
+                "desc": "",
+                "method": "get",
+                "url": "https://cloud.dify.ai/logo/logo-site.png",
+                "authorization": {
+                    "type": "no-auth",
+                    "config": None,
+                },
+                "params": "",
+                "headers": "",
+                "body": None,
+            },
+        }
+    )
+
+    result = node._run()
+    assert result.process_data is not None
+    assert result.outputs is not None
+    resp = result.outputs
+    assert len(resp.get("files", [])) == 1

From eb87e690ed6dbfce11b5a5bd41b063691e788fbf Mon Sep 17 00:00:00 2001
From: -LAN- <laipz8200@outlook.com>
Date: Wed, 30 Oct 2024 08:46:11 +0800
Subject: [PATCH 22/29] fix(llm-node): handle NoneSegment variables properly
 (#9978)

---
 api/core/workflow/nodes/llm/node.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/api/core/workflow/nodes/llm/node.py b/api/core/workflow/nodes/llm/node.py
index abf77f3339..472587cb03 100644
--- a/api/core/workflow/nodes/llm/node.py
+++ b/api/core/workflow/nodes/llm/node.py
@@ -327,7 +327,9 @@ class LLMNode(BaseNode[LLMNodeData]):
             if variable is None:
                 raise ValueError(f"Variable {variable_selector.variable} not found")
             if isinstance(variable, NoneSegment):
-                continue
+                # Use an empty-string placeholder and skip the generic assignment
+                # below, which would otherwise overwrite it immediately.
+                inputs[variable_selector.variable] = ""
+                continue
             inputs[variable_selector.variable] = variable.to_object()
 
         memory = node_data.memory

From c7fb8a4f20ad07be09d8d4b8003a8f00928ef9f9 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=9D=9E=E6=B3=95=E6=93=8D=E4=BD=9C?= <hjlarry@163.com>
Date: Wed, 30 Oct 2024 11:10:31 +0800
Subject: [PATCH 23/29] fix: conversation variable may not change in the answer
 node (#10034)

---
 api/core/workflow/nodes/answer/answer_stream_generate_router.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/api/core/workflow/nodes/answer/answer_stream_generate_router.py b/api/core/workflow/nodes/answer/answer_stream_generate_router.py
index bc4b056148..96e24a7db3 100644
--- a/api/core/workflow/nodes/answer/answer_stream_generate_router.py
+++ b/api/core/workflow/nodes/answer/answer_stream_generate_router.py
@@ -153,6 +153,7 @@ class AnswerStreamGeneratorRouter:
                 NodeType.IF_ELSE,
                 NodeType.QUESTION_CLASSIFIER,
                 NodeType.ITERATION,
+                NodeType.CONVERSATION_VARIABLE_ASSIGNER,
             }:
                 answer_dependencies[answer_node_id].append(source_node_id)
             else:

From f5d1c7cc0abe415d51e054bca179940dabb1f480 Mon Sep 17 00:00:00 2001
From: Lucas Rezende <lucas.c.rezende@gmail.com>
Date: Wed, 30 Oct 2024 00:12:31 -0300
Subject: [PATCH 24/29] Added: README_PT.md in Brazilian Portuguese (#10026)

Co-authored-by: Lucas Rezende <lucasrezende@MacBook-Pro-de-Lucas.local>
---
 README_PT.md | 241 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 241 insertions(+)
 create mode 100644 README_PT.md

diff --git a/README_PT.md b/README_PT.md
new file mode 100644
index 0000000000..3d66b76802
--- /dev/null
+++ b/README_PT.md
@@ -0,0 +1,241 @@
+![cover-v5-optimized](https://github.com/langgenius/dify/assets/13230914/f9e19af5-61ba-4119-b926-d10c4c06ebab)
+
+<p align="center">
+  📌 <a href="https://dify.ai/blog/introducing-dify-workflow-file-upload-a-demo-on-ai-podcast">Introduzindo o Dify Workflow com Upload de Arquivo: Recrie o Podcast Google NotebookLM</a>
+</p>
+
+<p align="center">
+  <a href="https://cloud.dify.ai">Dify Cloud</a> ·
+  <a href="https://docs.dify.ai/getting-started/install-self-hosted">Auto-hospedagem</a> ·
+  <a href="https://docs.dify.ai">Documentação</a> ·
+  <a href="https://udify.app/chat/22L1zSxg6yW1cWQg">Consultas empresariais</a>
+</p>
+
+<p align="center">
+    <a href="https://dify.ai" target="_blank">
+        <img alt="Static Badge" src="https://img.shields.io/badge/Product-F04438"></a>
+    <a href="https://dify.ai/pricing" target="_blank">
+        <img alt="Static Badge" src="https://img.shields.io/badge/free-pricing?logo=free&color=%20%23155EEF&label=pricing&labelColor=%20%23528bff"></a>
+    <a href="https://discord.gg/FngNHpbcY7" target="_blank">
+        <img src="https://img.shields.io/discord/1082486657678311454?logo=discord&labelColor=%20%235462eb&logoColor=%20%23f5f5f5&color=%20%235462eb"
+            alt="chat on Discord"></a>
+    <a href="https://twitter.com/intent/follow?screen_name=dify_ai" target="_blank">
+        <img src="https://img.shields.io/twitter/follow/dify_ai?logo=X&color=%20%23f5f5f5"
+            alt="follow on X(Twitter)"></a>
+    <a href="https://hub.docker.com/u/langgenius" target="_blank">
+        <img alt="Docker Pulls" src="https://img.shields.io/docker/pulls/langgenius/dify-web?labelColor=%20%23FDB062&color=%20%23f79009"></a>
+    <a href="https://github.com/langgenius/dify/graphs/commit-activity" target="_blank">
+        <img alt="Commits last month" src="https://img.shields.io/github/commit-activity/m/langgenius/dify?labelColor=%20%2332b583&color=%20%2312b76a"></a>
+    <a href="https://github.com/langgenius/dify/" target="_blank">
+        <img alt="Issues closed" src="https://img.shields.io/github/issues-search?query=repo%3Alanggenius%2Fdify%20is%3Aclosed&label=issues%20closed&labelColor=%20%237d89b0&color=%20%235d6b98"></a>
+    <a href="https://github.com/langgenius/dify/discussions/" target="_blank">
+        <img alt="Discussion posts" src="https://img.shields.io/github/discussions/langgenius/dify?labelColor=%20%239b8afb&color=%20%237a5af8"></a>
+</p>
+
+<p align="center">
+  <a href="./README.md"><img alt="README em Inglês" src="https://img.shields.io/badge/English-d9d9d9"></a>
+  <a href="./README_CN.md"><img alt="简体中文版自述文件" src="https://img.shields.io/badge/简体中文-d9d9d9"></a>
+  <a href="./README_JA.md"><img alt="日本語のREADME" src="https://img.shields.io/badge/日本語-d9d9d9"></a>
+  <a href="./README_ES.md"><img alt="README em Espanhol" src="https://img.shields.io/badge/Español-d9d9d9"></a>
+  <a href="./README_FR.md"><img alt="README em Francês" src="https://img.shields.io/badge/Français-d9d9d9"></a>
+  <a href="./README_KL.md"><img alt="README tlhIngan Hol" src="https://img.shields.io/badge/Klingon-d9d9d9"></a>
+  <a href="./README_KR.md"><img alt="README em Coreano" src="https://img.shields.io/badge/한국어-d9d9d9"></a>
+  <a href="./README_AR.md"><img alt="README em Árabe" src="https://img.shields.io/badge/العربية-d9d9d9"></a>
+  <a href="./README_TR.md"><img alt="README em Turco" src="https://img.shields.io/badge/Türkçe-d9d9d9"></a>
+  <a href="./README_VI.md"><img alt="README em Vietnamita" src="https://img.shields.io/badge/Ti%E1%BA%BFng%20Vi%E1%BB%87t-d9d9d9"></a>
+  <a href="./README_PT.md"><img alt="README em Português - BR" src="https://img.shields.io/badge/Portugu%C3%AAs-BR?style=flat&label=BR&color=d9d9d9"></a>
+</p>
+
+Dify é uma plataforma de desenvolvimento de aplicativos LLM de código aberto. Sua interface intuitiva combina workflow de IA, pipeline RAG, capacidades de agente, gerenciamento de modelos, recursos de observabilidade e muito mais, permitindo que você vá rapidamente do protótipo à produção. Aqui está uma lista das principais funcionalidades:
+</br> </br>
+
+**1. Workflow**: 
+  Construa e teste workflows poderosos de IA em uma interface visual, aproveitando todos os recursos a seguir e muito mais.
+
+
+  https://github.com/langgenius/dify/assets/13230914/356df23e-1604-483d-80a6-9517ece318aa
+
+
+
+**2. Suporte abrangente a modelos**: 
+  Integração perfeita com centenas de LLMs proprietários e de código aberto de diversos provedores e soluções auto-hospedadas, abrangendo GPT, Mistral, Llama3 e qualquer modelo compatível com a API da OpenAI. A lista completa de provedores suportados pode ser encontrada [aqui](https://docs.dify.ai/getting-started/readme/model-providers).
+
+![providers-v5](https://github.com/langgenius/dify/assets/13230914/5a17bdbe-097a-4100-8363-40255b70f6e3)
+
+
+**3. IDE de Prompt**: 
+  Interface intuitiva para criação de prompts, comparação de desempenho de modelos e adição de recursos como conversão de texto para fala em um aplicativo baseado em chat. 
+
+**4. Pipeline RAG**: 
+  Extensas capacidades de RAG que cobrem desde a ingestão de documentos até a recuperação, com suporte nativo para extração de texto de PDFs, PPTs e outros formatos de documentos comuns.
+
+**5. Capacidades de agente**: 
+  Você pode definir agentes com base em LLM Function Calling ou ReAct e adicionar ferramentas pré-construídas ou personalizadas para o agente. O Dify oferece mais de 50 ferramentas integradas para agentes de IA, como Google Search, DALL·E, Stable Diffusion e WolframAlpha.
+
+**6. LLMOps**: 
+  Monitore e analise os registros e o desempenho do aplicativo ao longo do tempo. É possível melhorar continuamente prompts, conjuntos de dados e modelos com base nos dados de produção e anotações.
+
+**7. Backend como Serviço**: 
+  Todos os recursos do Dify vêm com APIs correspondentes, permitindo que você integre o Dify sem esforço na lógica de negócios da sua empresa.
+
+
+## Comparação de recursos
+<table style="width: 100%;">
+  <tr>
+    <th align="center">Recurso</th>
+    <th align="center">Dify.AI</th>
+    <th align="center">LangChain</th>
+    <th align="center">Flowise</th>
+    <th align="center">OpenAI Assistants API</th>
+  </tr>
+  <tr>
+    <td align="center">Abordagem de Programação</td>
+    <td align="center">Orientada a API + Aplicativo</td>
+    <td align="center">Código Python</td>
+    <td align="center">Orientada a Aplicativo</td>
+    <td align="center">Orientada a API</td>
+  </tr>
+  <tr>
+    <td align="center">LLMs Suportados</td>
+    <td align="center">Variedade Rica</td>
+    <td align="center">Variedade Rica</td>
+    <td align="center">Variedade Rica</td>
+    <td align="center">Apenas OpenAI</td>
+  </tr>
+  <tr>
+    <td align="center">RAG Engine</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+  </tr>
+  <tr>
+    <td align="center">Agente</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+    <td align="center">✅</td>
+  </tr>
+  <tr>
+    <td align="center">Workflow</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+  </tr>
+  <tr>
+    <td align="center">Observabilidade</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+    <td align="center">❌</td>
+  </tr>
+  <tr>
+    <td align="center">Recursos Empresariais (SSO/Controle de Acesso)</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+    <td align="center">❌</td>
+    <td align="center">❌</td>
+  </tr>
+  <tr>
+    <td align="center">Implantação Local</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">✅</td>
+    <td align="center">❌</td>
+  </tr>
+</table>
+
+## Usando o Dify
+
+- **Nuvem </br>**
+Oferecemos o serviço [Dify Cloud](https://dify.ai) para qualquer pessoa experimentar sem nenhuma configuração. Ele fornece todas as funcionalidades da versão auto-hospedada, incluindo 200 chamadas GPT-4 gratuitas no plano sandbox.
+
+- **Auto-hospedagem do Dify Community Edition</br>**
+Configure rapidamente o Dify no seu ambiente com este [guia inicial](#início-rápido).
+Use nossa [documentação](https://docs.dify.ai) para referências adicionais e instruções mais detalhadas.
+
+- **Dify para empresas/organizações</br>**
+Oferecemos recursos adicionais voltados para empresas. [Envie suas perguntas através deste chatbot](https://udify.app/chat/22L1zSxg6yW1cWQg) ou [envie-nos um e-mail](mailto:business@dify.ai?subject=[GitHub]Business%20License%20Inquiry) para discutir necessidades empresariais. </br>
+  > Para startups e pequenas empresas que utilizam AWS, confira o [Dify Premium no AWS Marketplace](https://aws.amazon.com/marketplace/pp/prodview-t22mebxzwjhu6) e implante-o no seu próprio AWS VPC com um clique. É uma oferta AMI acessível com a opção de criar aplicativos com logotipo e marca personalizados.
+
+
+## Mantendo-se atualizado
+
+Dê uma estrela no Dify no GitHub e seja notificado imediatamente sobre novos lançamentos.
+
+![star-us](https://github.com/langgenius/dify/assets/13230914/b823edc1-6388-4e25-ad45-2f6b187adbb4)
+
+
+
+## Início rápido
+> Antes de instalar o Dify, certifique-se de que sua máquina atenda aos seguintes requisitos mínimos de sistema:
+> 
+>- CPU >= 2 Núcleos
+>- RAM >= 4 GiB
+
+</br>
+
+A maneira mais fácil de iniciar o servidor Dify é executar nosso arquivo [docker-compose.yml](docker/docker-compose.yaml). Antes de rodar o comando de instalação, certifique-se de que o [Docker](https://docs.docker.com/get-docker/) e o [Docker Compose](https://docs.docker.com/compose/install/) estão instalados na sua máquina:
+
+```bash
+cd docker
+cp .env.example .env
+docker compose up -d
+```
+
+Após a execução, você pode acessar o painel do Dify no navegador em [http://localhost/install](http://localhost/install) e iniciar o processo de inicialização.
+
+> Se você deseja contribuir com o Dify ou fazer desenvolvimento adicional, consulte nosso [guia para implantar a partir do código fonte](https://docs.dify.ai/getting-started/install-self-hosted/local-source-code).
+
+## Próximos passos
+
+Se precisar personalizar a configuração, consulte os comentários no nosso arquivo [.env.example](docker/.env.example) e atualize os valores correspondentes no seu arquivo `.env`. Além disso, talvez seja necessário fazer ajustes no próprio arquivo `docker-compose.yaml`, como alterar versões de imagem, mapeamentos de portas ou montagens de volumes, com base no seu ambiente de implantação específico e nas suas necessidades. Após fazer quaisquer alterações, execute novamente `docker compose up -d`. Você pode encontrar a lista completa de variáveis de ambiente disponíveis [aqui](https://docs.dify.ai/getting-started/install-self-hosted/environments).
+
+Se deseja configurar uma instalação de alta disponibilidade, há [Helm Charts](https://helm.sh/) e arquivos YAML contribuídos pela comunidade que permitem a implantação do Dify no Kubernetes.
+
+- [Helm Chart de @LeoQuote](https://github.com/douban/charts/tree/master/charts/dify)
+- [Helm Chart de @BorisPolonsky](https://github.com/BorisPolonsky/dify-helm)
+- [Arquivo YAML de @Winson-030](https://github.com/Winson-030/dify-kubernetes)
+
+#### Usando o Terraform para Implantação
+
+Implante o Dify em uma plataforma de nuvem com um único clique usando o [Terraform](https://www.terraform.io/).
+
+##### Azure Global
+- [Azure Terraform por @nikawang](https://github.com/nikawang/dify-azure-terraform)
+
+##### Google Cloud
+- [Google Cloud Terraform por @sotazum](https://github.com/DeNA/dify-google-cloud-terraform)
+
+## Contribuindo
+
+Para aqueles que desejam contribuir com código, veja nosso [Guia de Contribuição](https://github.com/langgenius/dify/blob/main/CONTRIBUTING.md). 
+Ao mesmo tempo, considere apoiar o Dify compartilhando-o nas redes sociais e em eventos e conferências.
+
+> Estamos buscando contribuidores para ajudar na tradução do Dify para idiomas além de mandarim e inglês. Se você tiver interesse em ajudar, consulte o [README i18n](https://github.com/langgenius/dify/blob/main/web/i18n/README.md) para mais informações e deixe-nos um comentário no canal `global-users` em nosso [Servidor da Comunidade no Discord](https://discord.gg/8Tpq4AcN9c).
+
+**Contribuidores**
+
+<a href="https://github.com/langgenius/dify/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=langgenius/dify" />
+</a>
+
+## Comunidade e contato
+
+* [Discussões no GitHub](https://github.com/langgenius/dify/discussions). Melhor para: compartilhar feedback e fazer perguntas.
+* [Problemas no GitHub](https://github.com/langgenius/dify/issues). Melhor para: relatar bugs encontrados no Dify.AI e propor novos recursos. Veja nosso [Guia de Contribuição](https://github.com/langgenius/dify/blob/main/CONTRIBUTING.md).
+* [Discord](https://discord.gg/FngNHpbcY7). Melhor para: compartilhar suas aplicações e interagir com a comunidade.
+* [X(Twitter)](https://twitter.com/dify_ai). Melhor para: compartilhar suas aplicações e interagir com a comunidade.
+
+## Histórico de estrelas
+
+[![Gráfico de Histórico de Estrelas](https://api.star-history.com/svg?repos=langgenius/dify&type=Date)](https://star-history.com/#langgenius/dify&Date)
+
+## Divulgação de segurança
+
+Para proteger sua privacidade, evite postar problemas de segurança no GitHub. Em vez disso, envie suas perguntas para security@dify.ai e forneceremos uma resposta mais detalhada.
+
+## Licença
+
+Este repositório está disponível sob a [Licença de Código Aberto Dify](LICENSE), que é essencialmente Apache 2.0 com algumas restrições adicionais.
\ No newline at end of file

From 68cb3822429c933597d2f4b187c2a8250ef35d61 Mon Sep 17 00:00:00 2001
From: Mab <shun.mab.37+github@gmail.com>
Date: Wed, 30 Oct 2024 12:15:55 +0900
Subject: [PATCH 25/29] =?UTF-8?q?Fix=20#10023=20:=20error=20in=20docker-co?=
 =?UTF-8?q?mpose.yaml=20about=20TIDB=5FON=5FQDRANT=5FCLIENT=E2=80=A6=20(#1?=
 =?UTF-8?q?0025)?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 docker/docker-compose.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docker/docker-compose.yaml b/docker/docker-compose.yaml
index 47e4a0ddbb..06c99b5eab 100644
--- a/docker/docker-compose.yaml
+++ b/docker/docker-compose.yaml
@@ -142,7 +142,7 @@ x-shared-env: &shared-api-worker-env
   TIDB_VECTOR_DATABASE: ${TIDB_VECTOR_DATABASE:-dify}
   TIDB_ON_QDRANT_URL: ${TIDB_ON_QDRANT_URL:-http://127.0.0.1}
   TIDB_ON_QDRANT_API_KEY: ${TIDB_ON_QDRANT_API_KEY:-dify}
-  TIDB_ON_QDRANT_CLIENT_TIMEOUT: ${TIDB_ON_QDRANT_API_KEY:-20}
+  TIDB_ON_QDRANT_CLIENT_TIMEOUT: ${TIDB_ON_QDRANT_CLIENT_TIMEOUT:-20}
   TIDB_ON_QDRANT_GRPC_ENABLED: ${TIDB_ON_QDRANT_GRPC_ENABLED:-false}
   TIDB_ON_QDRANT_GRPC_PORT: ${TIDB_ON_QDRANT_GRPC_PORT:-6334}
   TIDB_PUBLIC_KEY: ${TIDB_PUBLIC_KEY:-dify}

From 5ad5d0cff4e4922b2f8ff561770793322f978bdc Mon Sep 17 00:00:00 2001
From: ice yao <yao3690093@gmail.com>
Date: Wed, 30 Oct 2024 11:17:30 +0800
Subject: [PATCH 26/29] chore: Add aliyun oss tests (#10031)

---
 api/tests/unit_tests/oss/__mock/aliyun_oss.py | 100 ++++++++++++++++++
 .../oss/aliyun_oss/aliyun_oss/__init__.py     |   0
 .../aliyun_oss/aliyun_oss/test_aliyun_oss.py  |  22 ++++
 3 files changed, 122 insertions(+)
 create mode 100644 api/tests/unit_tests/oss/__mock/aliyun_oss.py
 create mode 100644 api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/__init__.py
 create mode 100644 api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/test_aliyun_oss.py

diff --git a/api/tests/unit_tests/oss/__mock/aliyun_oss.py b/api/tests/unit_tests/oss/__mock/aliyun_oss.py
new file mode 100644
index 0000000000..27e1c0ad85
--- /dev/null
+++ b/api/tests/unit_tests/oss/__mock/aliyun_oss.py
@@ -0,0 +1,100 @@
+import os
+import posixpath
+from unittest.mock import MagicMock
+
+import pytest
+from _pytest.monkeypatch import MonkeyPatch
+from oss2 import Bucket
+from oss2.models import GetObjectResult, PutObjectResult
+
+from tests.unit_tests.oss.__mock.base import (
+    get_example_bucket,
+    get_example_data,
+    get_example_filename,
+    get_example_filepath,
+    get_example_folder,
+)
+
+
+class MockResponse:
+    def __init__(self, status, headers, request_id):
+        self.status = status
+        self.headers = headers
+        self.request_id = request_id
+
+
+class MockAliyunOssClass:
+    def __init__(
+        self,
+        auth,
+        endpoint,
+        bucket_name,
+        is_cname=False,
+        session=None,
+        connect_timeout=None,
+        app_name="",
+        enable_crc=True,
+        proxies=None,
+        region=None,
+        cloudbox_id=None,
+        is_path_style=False,
+        is_verify_object_strict=True,
+    ):
+        self.bucket_name = get_example_bucket()
+        self.key = posixpath.join(get_example_folder(), get_example_filename())
+        self.content = get_example_data()
+        self.filepath = get_example_filepath()
+        self.resp = MockResponse(
+            200,
+            {
+                "etag": "ee8de918d05640145b18f70f4c3aa602",
+                "x-oss-version-id": "CAEQNhiBgMDJgZCA0BYiIDc4MGZjZGI2OTBjOTRmNTE5NmU5NmFhZjhjYmY0****",
+            },
+            "request_id",
+        )
+
+    def put_object(self, key, data, headers=None, progress_callback=None):
+        assert key == self.key
+        assert data == self.content
+        return PutObjectResult(self.resp)
+
+    def get_object(self, key, byte_range=None, headers=None, progress_callback=None, process=None, params=None):
+        assert key == self.key
+
+        get_object_output = MagicMock(GetObjectResult)
+        get_object_output.read.return_value = self.content
+        return get_object_output
+
+    def get_object_to_file(
+        self, key, filename, byte_range=None, headers=None, progress_callback=None, process=None, params=None
+    ):
+        assert key == self.key
+        assert filename == self.filepath
+
+    def object_exists(self, key, headers=None):
+        assert key == self.key
+        return True
+
+    def delete_object(self, key, params=None, headers=None):
+        assert key == self.key
+        self.resp.headers["x-oss-delete-marker"] = True
+        return self.resp
+
+
+MOCK = os.getenv("MOCK_SWITCH", "false").lower() == "true"
+
+
+@pytest.fixture
+def setup_aliyun_oss_mock(monkeypatch: MonkeyPatch):
+    if MOCK:
+        monkeypatch.setattr(Bucket, "__init__", MockAliyunOssClass.__init__)
+        monkeypatch.setattr(Bucket, "put_object", MockAliyunOssClass.put_object)
+        monkeypatch.setattr(Bucket, "get_object", MockAliyunOssClass.get_object)
+        monkeypatch.setattr(Bucket, "get_object_to_file", MockAliyunOssClass.get_object_to_file)
+        monkeypatch.setattr(Bucket, "object_exists", MockAliyunOssClass.object_exists)
+        monkeypatch.setattr(Bucket, "delete_object", MockAliyunOssClass.delete_object)
+
+    yield
+
+    if MOCK:
+        monkeypatch.undo()
diff --git a/api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/__init__.py b/api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/__init__.py
new file mode 100644
index 0000000000..e69de29bb2
diff --git a/api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/test_aliyun_oss.py b/api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/test_aliyun_oss.py
new file mode 100644
index 0000000000..65d31352bd
--- /dev/null
+++ b/api/tests/unit_tests/oss/aliyun_oss/aliyun_oss/test_aliyun_oss.py
@@ -0,0 +1,22 @@
+from unittest.mock import MagicMock, patch
+
+import pytest
+from oss2 import Auth
+
+from extensions.storage.aliyun_oss_storage import AliyunOssStorage
+from tests.unit_tests.oss.__mock.aliyun_oss import setup_aliyun_oss_mock
+from tests.unit_tests.oss.__mock.base import (
+    BaseStorageTest,
+    get_example_bucket,
+    get_example_folder,
+)
+
+
+class TestAliyunOss(BaseStorageTest):
+    @pytest.fixture(autouse=True)
+    def setup_method(self, setup_aliyun_oss_mock):
+        """Executed before each test method."""
+        with patch.object(Auth, "__init__", return_value=None):
+            self.storage = AliyunOssStorage()
+        self.storage.bucket_name = get_example_bucket()
+        self.storage.folder = get_example_folder()

From 9ebd453b87cd60a3d9d35157b3e337333e79be53 Mon Sep 17 00:00:00 2001
From: Jyong <76649700+JohnJyong@users.noreply.github.com>
Date: Wed, 30 Oct 2024 11:17:39 +0800
Subject: [PATCH 27/29] add rerank check when doing mutil-retrieval (#9998)

---
 api/core/rag/rerank/rerank_type.py          |  2 +-
 api/core/rag/retrieval/dataset_retrieval.py | 32 ++++++++++++++++++++-
 2 files changed, 32 insertions(+), 2 deletions(-)

diff --git a/api/core/rag/rerank/rerank_type.py b/api/core/rag/rerank/rerank_type.py
index d4894e3cc6..d71eb2daa8 100644
--- a/api/core/rag/rerank/rerank_type.py
+++ b/api/core/rag/rerank/rerank_type.py
@@ -1,6 +1,6 @@
 from enum import Enum
 
 
-class RerankMode(Enum):
+class RerankMode(str, Enum):
     RERANKING_MODEL = "reranking_model"
     WEIGHTED_SCORE = "weighted_score"
diff --git a/api/core/rag/retrieval/dataset_retrieval.py b/api/core/rag/retrieval/dataset_retrieval.py
index 3455cdc3c4..7a5bf39fa6 100644
--- a/api/core/rag/retrieval/dataset_retrieval.py
+++ b/api/core/rag/retrieval/dataset_retrieval.py
@@ -22,6 +22,7 @@ from core.rag.datasource.keyword.jieba.jieba_keyword_table_handler import JiebaK
 from core.rag.datasource.retrieval_service import RetrievalService
 from core.rag.entities.context_entities import DocumentContext
 from core.rag.models.document import Document
+from core.rag.rerank.rerank_type import RerankMode
 from core.rag.retrieval.retrieval_methods import RetrievalMethod
 from core.rag.retrieval.router.multi_dataset_function_call_router import FunctionCallMultiDatasetRouter
 from core.rag.retrieval.router.multi_dataset_react_route import ReactMultiDatasetRouter
@@ -361,10 +362,39 @@ class DatasetRetrieval:
         reranking_enable: bool = True,
         message_id: Optional[str] = None,
     ):
+        if not available_datasets:
+            return []
         threads = []
         all_documents = []
         dataset_ids = [dataset.id for dataset in available_datasets]
-        index_type = None
+        index_type_check = all(
+            item.indexing_technique == available_datasets[0].indexing_technique for item in available_datasets
+        )
+        if not index_type_check and (not reranking_enable or reranking_mode != RerankMode.RERANKING_MODEL):
+            raise ValueError(
+                "The configured knowledge base list have different indexing technique, please set reranking model."
+            )
+        index_type = available_datasets[0].indexing_technique
+        if index_type == "high_quality":
+            embedding_model_check = all(
+                item.embedding_model == available_datasets[0].embedding_model for item in available_datasets
+            )
+            embedding_model_provider_check = all(
+                item.embedding_model_provider == available_datasets[0].embedding_model_provider
+                for item in available_datasets
+            )
+            if (  # weighted-score mode is rejected when the datasets' embedding model/provider differ
+                reranking_enable
+                and reranking_mode == RerankMode.WEIGHTED_SCORE
+                and (not embedding_model_check or not embedding_model_provider_check)
+            ):
+                raise ValueError(
+                    "The configured knowledge base list have different embedding model, please set reranking model."
+                )
+            if reranking_enable and reranking_mode == RerankMode.WEIGHTED_SCORE:
+                weights["vector_setting"]["embedding_provider_name"] = available_datasets[0].embedding_model_provider
+                weights["vector_setting"]["embedding_model_name"] = available_datasets[0].embedding_model
+
         for dataset in available_datasets:
             index_type = dataset.indexing_technique
             retrieval_thread = threading.Thread(

From e74479717a2d72b6d0ef76a9a057a5d8dbfc4b05 Mon Sep 17 00:00:00 2001
From: Jyong <76649700+JohnJyong@users.noreply.github.com>
Date: Wed, 30 Oct 2024 11:17:46 +0800
Subject: [PATCH 28/29] fix update_by_api batch field issue (#10001)

---
 api/controllers/service_api/dataset/document.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/api/controllers/service_api/dataset/document.py b/api/controllers/service_api/dataset/document.py
index fb48a6c76c..0a0a38c4c6 100644
--- a/api/controllers/service_api/dataset/document.py
+++ b/api/controllers/service_api/dataset/document.py
@@ -230,7 +230,7 @@ class DocumentUpdateByFileApi(DatasetApiResource):
         except ProviderTokenNotInitError as ex:
             raise ProviderNotInitializeError(ex.description)
         document = documents[0]
-        documents_and_batch_fields = {"document": marshal(document, document_fields), "batch": batch}
+        documents_and_batch_fields = {"document": marshal(document, document_fields), "batch": document.batch}
         return documents_and_batch_fields, 200
 
 

From bab5c542197f935d35fe75eb5d2c3301fbbf58b4 Mon Sep 17 00:00:00 2001
From: Bowen Liang <liangbowen@gf.com.cn>
Date: Wed, 30 Oct 2024 11:18:23 +0800
Subject: [PATCH 29/29] chore: improve validation and handler of logging
 timezone with TimezoneName (#9595)

---
 api/configs/feature/__init__.py |  6 ++++--
 api/extensions/ext_logging.py   | 16 ++++++----------
 2 files changed, 10 insertions(+), 12 deletions(-)

diff --git a/api/configs/feature/__init__.py b/api/configs/feature/__init__.py
index 0fa926038d..a8a4170f67 100644
--- a/api/configs/feature/__init__.py
+++ b/api/configs/feature/__init__.py
@@ -10,6 +10,7 @@ from pydantic import (
     PositiveInt,
     computed_field,
 )
+from pydantic_extra_types.timezone_name import TimeZoneName
 from pydantic_settings import BaseSettings
 
 from configs.feature.hosted_service import HostedServiceConfig
@@ -339,8 +340,9 @@ class LoggingConfig(BaseSettings):
         default=None,
     )
 
-    LOG_TZ: Optional[str] = Field(
-        description="Timezone for log timestamps (e.g., 'America/New_York')",
+    LOG_TZ: Optional[TimeZoneName] = Field(
+        description="Timezone for log timestamps. Allowed timezone values can be referred to IANA Time Zone Database"
+        " (e.g., 'America/New_York')",
         default=None,
     )
 
diff --git a/api/extensions/ext_logging.py b/api/extensions/ext_logging.py
index 56b1d6bd28..0fa832f420 100644
--- a/api/extensions/ext_logging.py
+++ b/api/extensions/ext_logging.py
@@ -1,8 +1,10 @@
 import logging
 import os
 import sys
+from datetime import datetime
 from logging.handlers import RotatingFileHandler
 
+import pytz
 from flask import Flask
 
 from configs import dify_config
@@ -30,16 +32,10 @@ def init_app(app: Flask):
         handlers=log_handlers,
         force=True,
     )
+
     log_tz = dify_config.LOG_TZ
     if log_tz:
-        from datetime import datetime
-
-        import pytz
-
-        timezone = pytz.timezone(log_tz)
-
-        def time_converter(seconds):
-            return datetime.utcfromtimestamp(seconds).astimezone(timezone).timetuple()
-
         for handler in logging.root.handlers:
-            handler.formatter.converter = time_converter
+            handler.formatter.converter = lambda seconds: (  # astimezone() needs a tzinfo, not the zone name string
+                datetime.fromtimestamp(seconds, tz=pytz.UTC).astimezone(pytz.timezone(log_tz)).timetuple()
+            )