docs: add example implementation of Redux Slice for message management

- Introduced a new section in the technical documentation detailing the implementation of a `messages` slice using `createEntityAdapter`. - Provided TypeScript code for the slice, including actions for adding, updating, and removing messages. - Summarized the core principles of the slice's design, emphasizing single responsibility, logical separation of concerns, and performance optimization. - Included a migration strategy for transitioning from the previous state structure to the new message pool approach.
docs: finalize technical report for message history version management system with multi-model support
2025-06-12 18:34:36 +08:00 · 2025-06-12 15:59:54 +08:00 · 2025-06-12 14:25:42 +08:00
752 changed files with 13703 additions and 72627 deletions
--- a/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -1,17 +1,86 @@
 version: 2
 updates:
-  - package-ecosystem: 'github-actions'
-    directory: '/'
+  - package-ecosystem: "npm"
+    directory: "/"
    schedule:
-      interval: 'monthly'
+      interval: "monthly"
+    open-pull-requests-limit: 7
+    target-branch: "main"
+    commit-message:
+      prefix: "chore"
+      include: "scope"
+    groups:
+      # 核心框架
+      core-framework:
+        patterns:
+          - "react"
+          - "react-dom"
+          - "electron"
+          - "typescript"
+          - "@types/react*"
+          - "@types/node"
+        update-types:
+          - "minor"
+          - "patch"
+
+      # Electron 生态和构建工具
+      electron-build:
+        patterns:
+          - "electron-*"
+          - "@electron*"
+          - "vite"
+          - "@vitejs/*"
+          - "dotenv-cli"
+          - "rollup-plugin-*"
+          - "@swc/*"
+        update-types:
+          - "minor"
+          - "patch"
+
+      # 测试工具
+      testing-tools:
+        patterns:
+          - "vitest"
+          - "@vitest/*"
+          - "playwright"
+          - "@playwright/*"
+          - "eslint*"
+          - "@eslint*"
+          - "prettier"
+          - "husky"
+          - "lint-staged"
+        update-types:
+          - "minor"
+          - "patch"
+
+      # CherryStudio 自定义包
+      cherrystudio-packages:
+        patterns:
+          - "@cherrystudio/*"
+        update-types:
+          - "minor"
+          - "patch"
+
+      # 兜底其他 dependencies
+      other-dependencies:
+        dependency-type: "production"
+
+      # 兜底其他 devDependencies
+      other-dev-dependencies:
+        dependency-type: "development"
+
+  - package-ecosystem: "github-actions"
+    directory: "/"
+    schedule:
+      interval: "weekly"
    open-pull-requests-limit: 3
    commit-message:
-      prefix: 'ci'
-      include: 'scope'
+      prefix: "ci"
+      include: "scope"
    groups:
      github-actions:
        patterns:
-          - '*'
+          - "*"
        update-types:
-          - 'minor'
-          - 'patch'
+          - "minor"
+          - "patch"
--- a/.github/workflows/dispatch-docs-update.yml
+++ b/.github/workflows/dispatch-docs-update.yml
@@ -1,27 +0,0 @@
-name: Dispatch Docs Update on Release
-
-on:
-  release:
-    types: [released]
-
-permissions:
-  contents: write
-
-jobs:
-  dispatch-docs-update:
-    runs-on: ubuntu-latest
-    steps:
-      - name: Get Release Tag from Event
-        id: get-event-tag
-        shell: bash
-        run: |
-          # 从当前 Release 事件中获取 tag_name
-          echo "tag=${{ github.event.release.tag_name }}" >> $GITHUB_OUTPUT
-
-      - name: Dispatch update-download-version workflow to cherry-studio-docs
-        uses: peter-evans/repository-dispatch@v3
-        with:
-          token: ${{ secrets.REPO_DISPATCH_TOKEN }}
-          repository: CherryHQ/cherry-studio-docs
-          event-type: update-download-version
-          client-payload: '{"version": "${{ steps.get-event-tag.outputs.tag }}"}'
--- a/.github/workflows/pr-ci.yml
+++ b/.github/workflows/pr-ci.yml
@@ -44,4 +44,4 @@ jobs:
        run: yarn build:check

      - name: Lint Check
-        run: yarn test:lint
+        run: yarn lint
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -27,7 +27,7 @@ jobs:
      - name: Check out Git repository
        uses: actions/checkout@v4
        with:
-          fetch-depth: 0
+          ref: main

      - name: Get release tag
        id: get-tag
@@ -79,7 +79,6 @@ jobs:
          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          RENDERER_VITE_AIHUBMIX_SECRET: ${{ vars.RENDERER_VITE_AIHUBMIX_SECRET }}
          NODE_OPTIONS: --max-old-space-size=8192
-          MAIN_VITE_MINERU_API_KEY: ${{ vars.MAIN_VITE_MINERU_API_KEY }}

      - name: Build Mac
        if: matrix.os == 'macos-latest'
@@ -96,7 +95,6 @@ jobs:
          RENDERER_VITE_AIHUBMIX_SECRET: ${{ vars.RENDERER_VITE_AIHUBMIX_SECRET }}
          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          NODE_OPTIONS: --max-old-space-size=8192
-          MAIN_VITE_MINERU_API_KEY: ${{ vars.MAIN_VITE_MINERU_API_KEY }}

      - name: Build Windows
        if: matrix.os == 'windows-latest'
@@ -107,7 +105,6 @@ jobs:
          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          RENDERER_VITE_AIHUBMIX_SECRET: ${{ vars.RENDERER_VITE_AIHUBMIX_SECRET }}
          NODE_OPTIONS: --max-old-space-size=8192
-          MAIN_VITE_MINERU_API_KEY: ${{ vars.MAIN_VITE_MINERU_API_KEY }}

      - name: Release
        uses: ncipollo/release-action@v1
@@ -117,4 +114,39 @@ jobs:
          makeLatest: false
          tag: ${{ steps.get-tag.outputs.tag }}
          artifacts: 'dist/*.exe,dist/*.zip,dist/*.dmg,dist/*.AppImage,dist/*.snap,dist/*.deb,dist/*.rpm,dist/*.tar.gz,dist/latest*.yml,dist/rc*.yml,dist/*.blockmap'
-          token: ${{ secrets.GITHUB_TOKEN }}
+          token: ${{ secrets.GITHUB_TOKEN }}
+
+  dispatch-docs-update:
+    needs: release
+    if: success() && github.repository == 'CherryHQ/cherry-studio' # 确保所有构建成功且在主仓库中运行
+    runs-on: ubuntu-latest
+    steps:
+      - name: Get release tag
+        id: get-tag
+        shell: bash
+        run: |
+          if [ "${{ github.event_name }}" = "workflow_dispatch" ]; then
+            echo "tag=${{ github.event.inputs.tag }}" >> $GITHUB_OUTPUT
+          else
+            echo "tag=${GITHUB_REF#refs/tags/}" >> $GITHUB_OUTPUT
+          fi
+
+      - name: Check if tag is pre-release
+        id: check-tag
+        shell: bash
+        run: |
+          TAG="${{ steps.get-tag.outputs.tag }}"
+          if [[ "$TAG" == *"rc"* || "$TAG" == *"pre-release"* ]]; then
+            echo "is_pre_release=true" >> $GITHUB_OUTPUT
+          else
+            echo "is_pre_release=false" >> $GITHUB_OUTPUT
+          fi
+
+      - name: Dispatch update-download-version workflow to cherry-studio-docs
+        if: steps.check-tag.outputs.is_pre_release == 'false'
+        uses: peter-evans/repository-dispatch@v3
+        with:
+          token: ${{ secrets.REPO_DISPATCH_TOKEN }}
+          repository: CherryHQ/cherry-studio-docs
+          event-type: update-download-version
+          client-payload: '{"version": "${{ steps.get-tag.outputs.tag }}"}'
--- a/.vscode/launch.json
+++ b/.vscode/launch.json
@@ -7,6 +7,7 @@
      "request": "launch",
      "cwd": "${workspaceRoot}",
      "runtimeExecutable": "${workspaceRoot}/node_modules/.bin/electron-vite",
+      "runtimeVersion": "20",
      "windows": {
        "runtimeExecutable": "${workspaceRoot}/node_modules/.bin/electron-vite.cmd"
      },
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -1,8 +1,7 @@
 {
  "editor.formatOnSave": true,
  "editor.codeActionsOnSave": {
-    "source.fixAll.eslint": "explicit",
-    "source.organizeImports": "never"
+    "source.fixAll.eslint": "explicit"
  },
  "search.exclude": {
    "**/dist/**": true,
--- a/.yarn/patches/@google-genai-npm-1.0.1-e26f0f9af7.patch
+++ b/.yarn/patches/@google-genai-npm-1.0.1-e26f0f9af7.patch
--- a/.yarn/patches/antd-npm-5.24.7-356a553ae5.patch
+++ b/.yarn/patches/antd-npm-5.24.7-356a553ae5.patch
@@ -1,69 +0,0 @@
-diff --git a/es/dropdown/dropdown.js b/es/dropdown/dropdown.js
-index 986877a762b9ad0aca596a8552732cd12d2eaabb..1f18aa2ea745e68950e4cee16d4d655f5c835fd5 100644
--- a/es/dropdown/dropdown.js
-+++ b/es/dropdown/dropdown.js
-@@ -2,7 +2,7 @@
- 
- import * as React from 'react';
- import LeftOutlined from "@ant-design/icons/es/icons/LeftOutlined";
-import RightOutlined from "@ant-design/icons/es/icons/RightOutlined";
-+import { ChevronRight } from 'lucide-react';
- import classNames from 'classnames';
- import RcDropdown from 'rc-dropdown';
- import useEvent from "rc-util/es/hooks/useEvent";
-@@ -158,8 +158,10 @@ const Dropdown = props => {
-         className: `${prefixCls}-menu-submenu-arrow`
-       }, direction === 'rtl' ? (/*#__PURE__*/React.createElement(LeftOutlined, {
-         className: `${prefixCls}-menu-submenu-arrow-icon`
-      })) : (/*#__PURE__*/React.createElement(RightOutlined, {
-        className: `${prefixCls}-menu-submenu-arrow-icon`
-+      })) : (/*#__PURE__*/React.createElement(ChevronRight, {
-+        size: 16,
-+        strokeWidth: 1.8,
-+        className: `${prefixCls}-menu-submenu-arrow-icon lucide-custom`
-       }))),
-       mode: "vertical",
-       selectable: false,
-diff --git a/es/dropdown/style/index.js b/es/dropdown/style/index.js
-index 768c01783002c6901c85a73061ff6b3e776a60ce..39b1b95a56cdc9fb586a193c3adad5141f5cf213 100644
--- a/es/dropdown/style/index.js
-+++ b/es/dropdown/style/index.js
-@@ -240,7 +240,8 @@ const genBaseStyle = token => {
-               marginInlineEnd: '0 !important',
-               color: token.colorTextDescription,
-               fontSize: fontSizeIcon,
-              fontStyle: 'normal'
-+              fontStyle: 'normal',
-+              marginTop: 3,
-             }
-           }
-         }),
-diff --git a/es/select/useIcons.js b/es/select/useIcons.js
-index 959115be936ef8901548af2658c5dcfdc5852723..c812edd52123eb0faf4638b1154fcfa1b05b513b 100644
--- a/es/select/useIcons.js
-+++ b/es/select/useIcons.js
-@@ -4,10 +4,10 @@ import * as React from 'react';
- import CheckOutlined from "@ant-design/icons/es/icons/CheckOutlined";
- import CloseCircleFilled from "@ant-design/icons/es/icons/CloseCircleFilled";
- import CloseOutlined from "@ant-design/icons/es/icons/CloseOutlined";
-import DownOutlined from "@ant-design/icons/es/icons/DownOutlined";
- import LoadingOutlined from "@ant-design/icons/es/icons/LoadingOutlined";
- import SearchOutlined from "@ant-design/icons/es/icons/SearchOutlined";
- import { devUseWarning } from '../_util/warning';
-+import { ChevronDown } from 'lucide-react';
- export default function useIcons(_ref) {
-   let {
-     suffixIcon,
-@@ -56,8 +56,10 @@ export default function useIcons(_ref) {
-           className: iconCls
-         }));
-       }
-      return getSuffixIconNode(/*#__PURE__*/React.createElement(DownOutlined, {
-        className: iconCls
-+      return getSuffixIconNode(/*#__PURE__*/React.createElement(ChevronDown, {
-+        size: 16,
-+        strokeWidth: 1.8,
-+        className: `${iconCls} lucide-custom`
-       }));
-     };
-   }
--- a/.yarn/patches/app-builder-lib-npm-26.0.15-360e5b0476.patch
+++ b/.yarn/patches/app-builder-lib-npm-26.0.15-360e5b0476.patch
@@ -65,44 +65,11 @@ index e8bd7bb46c8a54b3f55cf3a853ef924195271e01..f956e9f3fe9eb903c78aef3502553b01
             await packager.info.emitArtifactBuildCompleted({
                 file: installerPath,
                 updateInfo,
-diff --git a/out/util/yarn.js b/out/util/yarn.js
-index 1ee20f8b252a8f28d0c7b103789cf0a9a427aec1..c2878ec54d57da50bf14225e0c70c9c88664eb8a 100644
--- a/out/util/yarn.js
-+++ b/out/util/yarn.js
-@@ -140,6 +140,7 @@ async function rebuild(config, { appDir, projectDir }, options) {
-         arch,
-         platform,
-         buildFromSource,
-+        ignoreModules: config.excludeReBuildModules || undefined,
-         projectRootPath: projectDir,
-         mode: config.nativeRebuilder || "sequential",
-         disablePreGypCopy: true,
 diff --git a/scheme.json b/scheme.json
-index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a74dda74c9 100644
+index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..a89c7a9b0b608fef67902c49106a43ebd0fa8b61 100644
 --- a/scheme.json
 +++ b/scheme.json
-@@ -1825,6 +1825,20 @@
-             "string"
-           ]
-         },
-+        "excludeReBuildModules": {
-+          "anyOf": [
-+            {
-+              "items": {
-+                "type": "string"
-+              },
-+              "type": "array"
-+            },
-+            {
-+              "type": "null"
-+            }
-+          ],
-+          "description": "The modules to exclude from the rebuild."
-+        },
-         "executableArgs": {
-           "anyOf": [
-             {
-@@ -1975,6 +1989,13 @@
+@@ -1975,6 +1975,13 @@
           ],
           "description": "The mime types in addition to specified in the file associations. Use it if you don't want to register a new mime type, but reuse existing."
         },
@@ -116,7 +83,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
         "packageCategory": {
           "description": "backward compatibility + to allow specify fpm-only category for all possible fpm targets in one place",
           "type": [
-@@ -2327,6 +2348,13 @@
+@@ -2327,6 +2334,13 @@
     "MacConfiguration": {
       "additionalProperties": false,
       "properties": {
@@ -130,28 +97,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
         "additionalArguments": {
           "anyOf": [
             {
-@@ -2527,6 +2555,20 @@
-             "string"
-           ]
-         },
-+        "excludeReBuildModules": {
-+          "anyOf": [
-+            {
-+              "items": {
-+                "type": "string"
-+              },
-+              "type": "array"
-+            },
-+            {
-+              "type": "null"
-+            }
-+          ],
-+          "description": "The modules to exclude from the rebuild."
-+        },
-         "executableName": {
-           "description": "The executable name. Defaults to `productName`.",
-           "type": [
-@@ -2737,7 +2779,7 @@
+@@ -2737,7 +2751,7 @@
           "type": "boolean"
         },
         "minimumSystemVersion": {
@@ -160,7 +106,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
           "type": [
             "null",
             "string"
-@@ -2959,6 +3001,13 @@
+@@ -2959,6 +2973,13 @@
     "MasConfiguration": {
       "additionalProperties": false,
       "properties": {
@@ -174,28 +120,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
         "additionalArguments": {
           "anyOf": [
             {
-@@ -3159,6 +3208,20 @@
-             "string"
-           ]
-         },
-+        "excludeReBuildModules": {
-+          "anyOf": [
-+            {
-+              "items": {
-+                "type": "string"
-+              },
-+              "type": "array"
-+            },
-+            {
-+              "type": "null"
-+            }
-+          ],
-+          "description": "The modules to exclude from the rebuild."
-+        },
-         "executableName": {
-           "description": "The executable name. Defaults to `productName`.",
-           "type": [
-@@ -3369,7 +3432,7 @@
+@@ -3369,7 +3390,7 @@
           "type": "boolean"
         },
         "minimumSystemVersion": {
@@ -204,28 +129,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
           "type": [
             "null",
             "string"
-@@ -6381,6 +6444,20 @@
-             "string"
-           ]
-         },
-+        "excludeReBuildModules": {
-+          "anyOf": [
-+            {
-+              "items": {
-+                "type": "string"
-+              },
-+              "type": "array"
-+            },
-+            {
-+              "type": "null"
-+            }
-+          ],
-+          "description": "The modules to exclude from the rebuild."
-+        },
-         "executableName": {
-           "description": "The executable name. Defaults to `productName`.",
-           "type": [
-@@ -6507,6 +6584,13 @@
+@@ -6507,6 +6528,13 @@
             "string"
           ]
         },
@@ -239,28 +143,7 @@ index 433e2efc9cef156ff5444f0c4520362ed2ef9ea7..0167441bf928a92f59b5dbe70b2317a7
         "protocols": {
           "anyOf": [
             {
-@@ -7153,6 +7237,20 @@
-         "string"
-       ]
-     },
-+    "excludeReBuildModules": {
-+      "anyOf": [
-+        {
-+          "items": {
-+            "type": "string"
-+          },
-+          "type": "array"
-+        },
-+        {
-+          "type": "null"
-+        }
-+      ],
-+      "description": "The modules to exclude from the rebuild."
-+    },
-     "executableName": {
-       "description": "The executable name. Defaults to `productName`.",
-       "type": [
-@@ -7376,6 +7474,13 @@
+@@ -7376,6 +7404,13 @@
       ],
       "description": "MAS (Mac Application Store) development options (`mas-dev` target)."
     },
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -1,4 +1,4 @@
-[中文](docs/CONTRIBUTING.zh.md) | [English](CONTRIBUTING.md)
+[中文](./docs/CONTRIBUTING.zh.md) | [English](./CONTRIBUTING.md)

 # Cherry Studio Contributor Guide

@@ -58,10 +58,6 @@ git commit --signoff -m "Your commit message"

 Maintainers are here to help you implement your use case within a reasonable timeframe. They will do their best to review your code and provide constructive feedback promptly. However, if you get stuck during the review process or feel your Pull Request is not receiving the attention it deserves, please contact us via comments in the Issue or through the [Community](README.md#-community).

-### Participating in the Test Plan
-
-The Test Plan aims to provide users with a more stable application experience and faster iteration speed. For details, please refer to the [Test Plan](docs/testplan-en.md).
-
 ### Other Suggestions

 - **Contact Developers**: Before submitting a PR, you can contact the developers first to discuss or get help.
--- a/README.md
+++ b/README.md
@@ -1,54 +1,34 @@
-<div align="right" >
-  <details>
-    <summary >🌐 Language</summary>
-    <div>
-      <div align="right">
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=en">English</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=zh-CN">简体中文</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=zh-TW">繁體中文</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ja">日本語</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ko">한국어</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=hi">हिन्दी</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=th">ไทย</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=fr">Français</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=de">Deutsch</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=es">Español</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=it">Itapano</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ru">Русский</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=pt">Português</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=nl">Nederlands</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=pl">Polski</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ar">العربية</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=fa">فارسی</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=tr">Türkçe</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=vi">Tiếng Việt</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=id">Bahasa Indonesia</a></p>
-      </div>
-    </div>
-  </details>
-</div>
-
 <h1 align="center">
  <a href="https://github.com/CherryHQ/cherry-studio/releases">
    <img src="https://github.com/CherryHQ/cherry-studio/blob/main/build/icon.png?raw=true" width="150" height="150" alt="banner" /><br>
  </a>
 </h1>
+  <p align="center">English | <a href="./docs/README.zh.md">中文</a> | <a href="./docs/README.ja.md">日本語</a> | <a href="https://cherry-ai.com">Official Site</a> | <a href="https://docs.cherry-ai.com/cherry-studio-wen-dang/en-us">Documents</a> | <a href="./docs/dev.md">Development</a> | <a href="https://github.com/CherryHQ/cherry-studio/issues">Feedback</a><br></p>

-<p align="center">English | <a href="./docs/README.zh.md">中文</a> | <a href="https://cherry-ai.com">Official Site</a> | <a href="https://docs.cherry-ai.com/cherry-studio-wen-dang/en-us">Documents</a> | <a href="./docs/dev.md">Development</a> | <a href="https://github.com/CherryHQ/cherry-studio/issues">Feedback</a><br></p>
+<!-- 题头徽章组合 -->

 <div align="center">
-  
+
 [![][deepwiki-shield]][deepwiki-link]
 [![][twitter-shield]][twitter-link]
 [![][discord-shield]][discord-link]
 [![][telegram-shield]][telegram-link]

 </div>
+
+<!-- 项目统计徽章 -->
+
 <div align="center">
-  
+
+[![][github-stars-shield]][github-stars-link]
+[![][github-forks-shield]][github-forks-link]
 [![][github-release-shield]][github-release-link]
-[![][github-nightly-shield]][github-nightly-link]
 [![][github-contributors-shield]][github-contributors-link]
+
+</div>
+
+<div align="center">
+
 [![][license-shield]][license-link]
 [![][commercial-shield]][commercial-link]
 [![][sponsor-shield]][sponsor-link]
@@ -56,9 +36,9 @@
 </div>

 <div align="center">
- <a href="https://hellogithub.com/repository/1605492e1e2a4df3be07abfa4578dd37" target="_blank" style="text-decoration: none"><img src="https://api.hellogithub.com/v1/widgets/recommend.svg?rid=1605492e1e2a4df3be07abfa4578dd37" alt="Featured｜HelloGitHub"  width="220" height="55" /></a>
- <a href="https://trendshift.io/repositories/11772" target="_blank" style="text-decoration: none"><img src="https://trendshift.io/api/badge/repositories/11772" alt="kangfenmao%2Fcherry-studio | Trendshift" width="220" height="55" /></a>
- <a href="https://www.producthunt.com/posts/cherry-studio?embed=true&utm_source=badge-featured&utm_medium=badge&utm_souce=badge-cherry&#0045;studio" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/featured.svg?post_id=496640&theme=light" alt="Cherry&#0032;Studio - AI&#0032;Chatbots&#0044;&#0032;AI&#0032;Desktop&#0032;Client | Product Hunt" width="220" height="55" /></a>
+ <a href="https://hellogithub.com/repository/1605492e1e2a4df3be07abfa4578dd37" target="_blank"><img src="https://api.hellogithub.com/v1/widgets/recommend.svg?rid=1605492e1e2a4df3be07abfa4578dd37" alt="Featured｜HelloGitHub" style="width: 200px; height: 43px;" width="200" height="43" /></a>
+ <a href="https://trendshift.io/repositories/11772" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11772" alt="kangfenmao%2Fcherry-studio | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
+ <a href="https://www.producthunt.com/posts/cherry-studio?embed=true&utm_source=badge-featured&utm_medium=badge&utm_souce=badge-cherry&#0045;studio" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/featured.svg?post_id=496640&theme=light" alt="Cherry&#0032;Studio - AI&#0032;Chatbots&#0044;&#0032;AI&#0032;Desktop&#0032;Client | Product Hunt" style="width: 200px; height: 43px;" width="200" height="43" /></a>
 </div>

 # 🍒 Cherry Studio
@@ -183,82 +163,10 @@ Refer to the [Branching Strategy](docs/branching-strategy-en.md) for contributio
 3. **Submit Changes**: Commit and push your changes.
 4. **Open a Pull Request**: Describe your changes and reasons.

-For more detailed guidelines, please refer to our [Contributing Guide](CONTRIBUTING.md).
+For more detailed guidelines, please refer to our [Contributing Guide](./CONTRIBUTING.md).

 Thank you for your support and contributions!

-# 🔧 Developer Co-creation Program
-
-We are launching the Cherry Studio Developer Co-creation Program to foster a healthy and positive-feedback loop within the open-source ecosystem. We believe that great software is built collaboratively, and every merged pull request breathes new life into the project.
-
-We sincerely invite you to join our ranks of contributors and shape the future of Cherry Studio with us.
-
-## Contributor Rewards Program
-
-To give back to our core contributors and create a virtuous cycle, we have established the following long-term incentive plan.
-
-**The inaugural tracking period for this program will be Q3 2025 (July, August, September). Rewards for this cycle will be distributed on October 1st.**
-
-Within any tracking period (e.g., July 1st to September 30th for the first cycle), any developer who contributes more than **30 meaningful commits** to any of Cherry Studio's open-source projects on GitHub is eligible for the following benefits:
-
- **Cursor Subscription Sponsorship**: Receive a **$70 USD** credit or reimbursement for your [Cursor](https://cursor.sh/) subscription, making AI your most efficient coding partner.
- **Unlimited Model Access**: Get **unlimited** API calls for the **DeepSeek** and **Qwen** models.
- **Cutting-Edge Tech Access**: Enjoy occasional perks, including API access to models like **Claude**, **Gemini**, and **OpenAI**, keeping you at the forefront of technology.
-
-## Growing Together & Future Plans
-
-A vibrant community is the driving force behind any sustainable open-source project. As Cherry Studio grows, so will our rewards program. We are committed to continuously aligning our benefits with the best-in-class tools and resources in the industry. This ensures our core contributors receive meaningful support, creating a positive cycle where developers, the community, and the project grow together.
-
-**Moving forward, the project will also embrace an increasingly open stance to give back to the entire open-source community.**
-
-## How to Get Started?
-
-We look forward to your first Pull Request!
-
-You can start by exploring our repositories, picking up a `good first issue`, or proposing your own enhancements. Every commit is a testament to the spirit of open source.
-
-Thank you for your interest and contributions.
-
-Let's build together.
-
-# 🏢 Enterprise Edition
-
-Building on the Community Edition, we are proud to introduce **Cherry Studio Enterprise Edition**—a privately deployable AI productivity and management platform designed for modern teams and enterprises.
-
-The Enterprise Edition addresses core challenges in team collaboration by centralizing the management of AI resources, knowledge, and data. It empowers organizations to enhance efficiency, foster innovation, and ensure compliance, all while maintaining 100% control over their data in a secure environment.
-
-## Core Advantages
-
- **Unified Model Management**: Centrally integrate and manage various cloud-based LLMs (e.g., OpenAI, Anthropic, Google Gemini) and locally deployed private models. Employees can use them out-of-the-box without individual configuration.
- **Enterprise-Grade Knowledge Base**: Build, manage, and share team-wide knowledge bases. Ensure knowledge is retained and consistent, enabling team members to interact with AI based on unified and accurate information.
- **Fine-Grained Access Control**: Easily manage employee accounts and assign role-based permissions for different models, knowledge bases, and features through a unified admin backend.
- **Fully Private Deployment**: Deploy the entire backend service on your on-premises servers or private cloud, ensuring your data remains 100% private and under your control to meet the strictest security and compliance standards.
- **Reliable Backend Services**: Provides stable API services, enterprise-grade data backup and recovery mechanisms to ensure business continuity.
-
-## ✨ Online Demo
-
-> 🚧 **Public Beta Notice**
->
-> The Enterprise Edition is currently in its early public beta stage, and we are actively iterating and optimizing its features. We are aware that it may not be perfectly stable yet. If you encounter any issues or have valuable suggestions during your trial, we would be very grateful if you could contact us via email to provide feedback.
-
-**🔗 [Cherry Studio Enterprise](https://www.cherry-ai.com/enterprise)**
-
-## Version Comparison
-
-| Feature           | Community Edition                          | Enterprise Edition                                                                                                                      |
-| :---------------- | :----------------------------------------- | :-------------------------------------------------------------------------------------------------------------------------------------- |
-| **Open Source**   | ✅ Yes                                     | ⭕️ part. released to cust.                                                                                                              |
-| **Cost**          | Free for Personal Use / Commercial License | Buyout / Subscription Fee                                                                                                               |
-| **Admin Backend** | —                                          | ● Centralized **Model** Access<br>● **Employee** Management<br>● Shared **Knowledge Base**<br>● **Access** Control<br>● **Data** Backup |
-| **Server**        | —                                          | ✅ Dedicated Private Deployment                                                                                                         |
-
-## Get the Enterprise Edition
-
-We believe the Enterprise Edition will become your team's AI productivity engine. If you are interested in Cherry Studio Enterprise Edition and would like to learn more, request a quote, or schedule a demo, please contact us.
-
- **For Business Inquiries & Purchasing**:
-  **📧 [bd@cherry-ai.com](mailto:bd@cherry-ai.com)**
-
 # 🔗 Related Projects

 - [one-api](https://github.com/songquanpeng/one-api):LLM API management and distribution system, supporting mainstream models like OpenAI, Azure, and Anthropic. Features unified API interface, suitable for key management and secondary distribution.
@@ -272,45 +180,34 @@ We believe the Enterprise Edition will become your team's AI productivity engine
 </a>
 <br /><br />

-# 📊 GitHub Stats
-
-![Stats](https://repobeats.axiom.co/api/embed/a693f2e5f773eed620f70031e974552156c7f397.svg 'Repobeats analytics image')
-
 # ⭐️ Star History

-<a href="https://www.star-history.com/#CherryHQ/cherry-studio&Date">
- <picture>
-   <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date&theme=dark" />
-   <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date" />
-   <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date" />
- </picture>
-</a>
+[![Star History Chart](https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Timeline)](https://star-history.com/#CherryHQ/cherry-studio&Timeline)

 <!-- Links & Images -->
-
-[deepwiki-shield]: https://img.shields.io/badge/Deepwiki-CherryHQ-0088CC?logo=data:image/svg+xml;base64,PHN2ZyB4bWxucz0iaHR0cDovL3d3dy53My5vcmcvMjAwMC9zdmciIHZpZXdCb3g9IjAgMCAyNy45MyAzMiI+PHBhdGggZD0iTTE5LjMzIDE0LjEyYy42Ny0uMzkgMS41LS4zOSAyLjE4IDBsMS43NCAxYy4wNi4wMy4xMS4wNi4xOC4wN2guMDRjLjA2LjAzLjEyLjAzLjE4LjAzaC4wMmMuMDYgMCAuMTEgMCAuMTctLjAyaC4wM2MuMDYtLjAyLjEyLS4wNS4xNy0uMDhoLjAybDMuNDgtMi4wMWMuMjUtLjE0LjQtLjQxLjQtLjdWOC40YS44MS44MSAwIDAgMC0uNC0uN2wtMy40OC0yLjAxYS44My44MyAwIDAgMC0uODEgMEwxOS43NyA3LjdoLS4wMWwtLjE1LjEyLS4wMi4wMnMtLjA3LjA5LS4xLjE0VjhhLjQuNCAwIDAgMC0uMDguMTd2LjA0Yy0uMDMuMDYtLjAzLjEyLS4wMy4xOXYyLjAxYzAgLjc4LS40MSAxLjQ5LTEuMDkgMS44OC0uNjcuMzktMS41LjM5LTIuMTggMGwtMS43NC0xYS42LjYgMCAwIDAtLjIxLS4wOGMtLjA2LS4wMS0uMTItLjAyLS4xOC0uMDJoLS4wM2MtLjA2IDAtLjExLjAxLS4xNy4wMmgtLjAzYy0uMDYuMDItLjEyLjA0LS4xNy4wN2gtLjAybC0zLjQ3IDIuMDFjLS4yNS4xNC0uNC40MS0uNC43VjE4YzAgLjI5LjE1LjU1LjQuN2wzLjQ4IDIuMDFoLjAyYy4wNi4wNC4xMS4wNi4xNy4wOGguMDNjLjA1LjAyLjExLjAzLjE3LjAzaC4wMmMuMDYgMCAuMTIgMCAuMTgtLjAyaC4wNGMuMDYtLjAzLjEyLS4wNS4xOC0uMDhsMS43NC0xYy42Ny0uMzkgMS41LS4zOSAyLjE3IDBzMS4wOSAxLjExIDEuMDkgMS44OHYyLjAxYzAgLjA3IDAgLjEzLjAyLjE5di4wNGMuMDMuMDYuMDUuMTIuMDguMTd2LjAycy4wOC4wOS4xMi4xM2wuMDIuMDJzLjA5LjA4LjE1LjExYzAgMCAuMDEgMCAuMDEuMDFsMy40OCAyLjAxYy4yNS4xNC41Ni4xNC44MSAwbDMuNDgtMi4wMWMuMjUtLjE0LjQtLjQxLjQtLjd2LTQuMDFhLjgxLjgxIDAgMCAwLS40LS43bC0zLjQ4LTIuMDFoLS4wMmMtLjA1LS4wNC0uMTEtLjA2LS4xNy0uMDhoLS4wM2EuNS41IDAgMCAwLS4xNy0uMDNoLS4wM2MtLjA2IDAtLjEyIDAtLjE4LjAyLS4wNy4wMi0uMTUuMDUtLjIxLjA4bC0xLjc0IDFjLS42Ny4zOS0xLjUuMzktMi4xNyAwYTIuMTkgMi4xOSAwIDAgMS0xLjA5LTEuODhjMC0uNzguNDItMS40OSAxLjA5LTEuODhaIiBzdHlsZT0iZmlsbDojNWRiZjlkIi8+PHBhdGggZD0ibS40IDEzLjExIDMuNDcgMi4wMWMuMjUuMTQuNTYuMTQuOCAwbDMuNDctMi4wMWguMDFsLjE1LS4xMi4wMi0uMDJzLjA3LS4wOS4xLS4xNGwuMDItLjAyYy4wMy0uMDUuMDUtLjExLjA3LS4xN3YtLjA0Yy4wMy0uMDYuMDMtLjEyLjAzLS4xOVYxMC40YzAtLjc4LjQyLTEuNDkgMS4wOS0xLjg4czEuNS0uMzkgMi4xOCAwbDEuNzQgMWMuMDcuMDQuMTQuMDcuMjEuMDguMDYuMDEuMTIuMDIuMTguMDJoLjAzYy4wNiAwIC4xMS0uMDEuMTctLjAyaC4wM2MuMDYtLjAyLjEyLS4wNC4xNy0uMDdoLjAybDMuNDctMi4wMmMuMjUtLjE0LjQtLjQxLjQtLjd2LTRhLjgxLjgxIDAgMCAwLS40LS43bC0zLjQ2LTJhLjgzLjgzIDAgMCAwLS44MSAwbC0zLjQ4IDIuMDFoLS4wMWwtLjE1LjEyLS4wMi4wMi0uMS4xMy0uMDIuMDJjLS4wMy4wNS0uMDUuMTEtLjA3LjE3di4wNGMtLjAzLjA2LS4wMy4xMi0uMDMuMTl2Mi4wMWMwIC43OC0uNDIgMS40OS0xLjA5IDEuODhzLTEuNS4zOS0yLjE4IDBsLTEuNzQtMWEuNi42IDAgMCAwLS4yMS0uMDhjLS4wNi0uMDEtLjEyLS4wMi0uMTgtLjAyaC0uMDNjLS4wNiAwLS4xMS4wMS0uMTcuMDJoLS4wM2MtLjA2LjAyLS4xMi4wNS0uMTcuMDhoLS4wMkwuNCA3LjcxYy0uMjUuMTQtLjQuNDEtLjQuNjl2NC4wMWMwIC4yOS4xNS41Ni40LjciIHN0eWxlPSJmaWxsOiM0NDY4YzQiLz48cGF0aCBkPSJtMTcuODQgMjQuNDgtMy40OC0yLjAxaC0uMDJjLS4wNS0uMDQtLjExLS4wNi0uMTctLjA4aC0uMDNhLjUuNSAwIDAgMC0uMTctLjAzaC0uMDNjLS4wNiAwLS4xMiAwLS4xOC4wMmgtLjA0Yy0uMDYuMDMtLjEyLjA1LS4xOC4wOGwtMS43NCAxYy0uNjcuMzktMS41LjM5LTIuMTggMGEyLjE5IDIuMTkgMCAwIDEtMS4wOS0xLjg4di0yLjAxYzAtLjA2IDAtLjEzLS4wMi0uMTl2LS4wNGMtLjAzLS4wNi0uMDUtLjExLS4wOC0uMTdsLS4wMi0uMDJzLS4wNi0uMDktLjEtLjEzTDguMjkgMTlzLS4wOS0uMDgtLjE1LS4xMWgtLjAxbC0zLjQ3LTIuMDJhLjgzLjgzIDAgMCAwLS44MSAwTC4zNyAxOC44OGEuODcuODcgMCAwIDAtLjM3LjcxdjQuMDFjMCAuMjkuMTUuNTUuNC43bDMuNDcgMi4wMWguMDJjLjA1LjA0LjExLjA2LjE3LjA4aC4wM2MuMDUuMDIuMTEuMDMuMTYuMDNoLjAzYy4wNiAwIC4xMiAwIC4xOC0uMDJoLjA0Yy4wNi0uMDMuMTItLjA1LjE4LS4wOGwxLjc0LTFjLjY3LS4zOSAxLjUtLjM5IDIuMTcgMHMxLjA5IDEuMTEgMS4wOSAxLjg4djIuMDFjMCAuMDcgMCAuMTMuMDIuMTl2LjA0Yy4wMy4wNi4wNS4xMS4wOC4xN2wuMDIuMDJzLjA2LjA5LjEuMTRsLjAyLjAycy4wOS4wOC4xNS4xMWguMDFsMy40OCAyLjAyYy4yNS4xNC41Ni4xNC44MSAwbDMuNDgtMi4wMWMuMjUtLjE0LjQtLjQxLjQtLjdWMjUuMmEuODEuODEgMCAwIDAtLjQtLjdaIiBzdHlsZT0iZmlsbDojNDI5M2Q5Ii8+PC9zdmc+
+[deepwiki-shield]: https://img.shields.io/badge/Deepwiki-CherryHQ-0088CC?style=plastic
 [deepwiki-link]: https://deepwiki.com/CherryHQ/cherry-studio
-[twitter-shield]: https://img.shields.io/badge/Twitter-CherryStudioApp-0088CC?logo=x
+[twitter-shield]: https://img.shields.io/badge/Twitter-CherryStudioApp-0088CC?style=plastic&logo=x
 [twitter-link]: https://twitter.com/CherryStudioHQ
-[discord-shield]: https://img.shields.io/badge/Discord-@CherryStudio-0088CC?logo=discord
+[discord-shield]: https://img.shields.io/badge/Discord-@CherryStudio-0088CC?style=plastic&logo=discord
 [discord-link]: https://discord.gg/wez8HtpxqQ
-[telegram-shield]: https://img.shields.io/badge/Telegram-@CherryStudioAI-0088CC?logo=telegram
+[telegram-shield]: https://img.shields.io/badge/Telegram-@CherryStudioAI-0088CC?style=plastic&logo=telegram
 [telegram-link]: https://t.me/CherryStudioAI

 <!-- Links & Images -->
-
-[github-release-shield]: https://img.shields.io/github/v/release/CherryHQ/cherry-studio?logo=github
+[github-stars-shield]: https://img.shields.io/github/stars/CherryHQ/cherry-studio?style=social
+[github-stars-link]: https://github.com/CherryHQ/cherry-studio/stargazers
+[github-forks-shield]: https://img.shields.io/github/forks/CherryHQ/cherry-studio?style=social
+[github-forks-link]: https://github.com/CherryHQ/cherry-studio/network
+[github-release-shield]: https://img.shields.io/github/v/release/CherryHQ/cherry-studio
 [github-release-link]: https://github.com/CherryHQ/cherry-studio/releases
-[github-nightly-shield]: https://img.shields.io/github/actions/workflow/status/CherryHQ/cherry-studio/nightly-build.yml?label=nightly%20build&logo=github
-[github-nightly-link]: https://github.com/CherryHQ/cherry-studio/actions/workflows/nightly-build.yml
-[github-contributors-shield]: https://img.shields.io/github/contributors/CherryHQ/cherry-studio?logo=github
+[github-contributors-shield]: https://img.shields.io/github/contributors/CherryHQ/cherry-studio
 [github-contributors-link]: https://github.com/CherryHQ/cherry-studio/graphs/contributors

 <!-- Links & Images -->
-
-[license-shield]: https://img.shields.io/badge/License-AGPLv3-important.svg?logo=gnu
+[license-shield]: https://img.shields.io/badge/License-AGPLv3-important.svg?style=plastic&logo=gnu
 [license-link]: https://www.gnu.org/licenses/agpl-3.0
-[commercial-shield]: https://img.shields.io/badge/License-Contact-white.svg?logoColor=white&logo=telegram&color=blue
+[commercial-shield]: https://img.shields.io/badge/License-Contact-white.svg?style=plastic&logoColor=white&logo=telegram&color=blue
 [commercial-link]: mailto:license@cherry-ai.com?subject=Commercial%20License%20Inquiry
-[sponsor-shield]: https://img.shields.io/badge/Sponsor-FF6699.svg?logo=githubsponsors&logoColor=white
+[sponsor-shield]: https://img.shields.io/badge/Sponsor-FF6699.svg?style=plastic&logo=githubsponsors&logoColor=white
 [sponsor-link]: https://github.com/CherryHQ/cherry-studio/blob/main/docs/sponsor.md
--- a/docs/CONTRIBUTING.zh.md
+++ b/docs/CONTRIBUTING.zh.md
@@ -1,6 +1,6 @@
 # Cherry Studio 贡献者指南

-[**English**](../CONTRIBUTING.md) | [**中文**](CONTRIBUTING.zh.md)
+[**English**](../CONTRIBUTING.md) | [**中文**](./CONTRIBUTING.zh.md)

 欢迎来到 Cherry Studio 的贡献者社区！我们致力于将 Cherry Studio 打造成一个长期提供价值的项目，并希望邀请更多的开发者加入我们的行列。无论您是经验丰富的开发者还是刚刚起步的初学者，您的贡献都将帮助我们更好地服务用户，提升软件质量。

@@ -24,7 +24,7 @@

 ## 开始之前

-请确保阅读了[行为准则](../CODE_OF_CONDUCT.md)和[LICENSE](../LICENSE)。
+请确保阅读了[行为准则](CODE_OF_CONDUCT.md)和[LICENSE](LICENSE)。

 ## 开始贡献

@@ -32,7 +32,7 @@

 ### 测试

-未经测试的功能等同于不存在。为确保代码真正有效，应通过单元测试和功能测试覆盖相关流程。因此，在考虑贡献时，也请考虑可测试性。所有测试均可本地运行，无需依赖 CI。请参阅[开发者指南](dev.md#test)中的“Test”部分。
+未经测试的功能等同于不存在。为确保代码真正有效，应通过单元测试和功能测试覆盖相关流程。因此，在考虑贡献时，也请考虑可测试性。所有测试均可本地运行，无需依赖 CI。请参阅[开发者指南](docs/dev.md#test)中的“Test”部分。

 ### 拉取请求的自动化测试

@@ -60,11 +60,7 @@ git commit --signoff -m "Your commit message"

 ### 获取代码审查/合并

-维护者在此帮助您在合理时间内实现您的用例。他们会尽力在合理时间内审查您的代码并提供建设性反馈。但如果您在审查过程中受阻，或认为您的 Pull Request 未得到应有的关注，请通过 Issue 中的评论或者[社群](README.zh.md#-community)联系我们
-
-### 参与测试计划
-
-测试计划旨在为用户提供更稳定的应用体验和更快的迭代速度，详细情况请参阅[测试计划](testplan-zh.md)。
+维护者在此帮助您在合理时间内实现您的用例。他们会尽力在合理时间内审查您的代码并提供建设性反馈。但如果您在审查过程中受阻，或认为您的 Pull Request 未得到应有的关注，请通过 Issue 中的评论或者[社群](README.md#-community)联系我们

 ### 其他建议

--- a/docs/README.ja.md
+++ b/docs/README.ja.md
@@ -0,0 +1,215 @@
+<h1 align="center">
+  <a href="https://github.com/CherryHQ/cherry-studio/releases">
+    <img src="https://github.com/CherryHQ/cherry-studio/blob/main/build/icon.png?raw=true" width="150" height="150" alt="banner" /><br>
+  </a>
+</h1>
+<p align="center">
+  <a href="https://github.com/CherryHQ/cherry-studio">English</a> | <a href="./README.zh.md">中文</a> | 日本語 | <a href="https://cherry-ai.com">公式サイト</a> | <a href="https://docs.cherry-ai.com/cherry-studio-wen-dang/ja">ドキュメント</a> | <a href="./dev.md">開発</a> | <a href="https://github.com/CherryHQ/cherry-studio/issues">フィードバック</a><br>
+</p>
+
+<!-- バッジコレクション -->
+
+<div align="center">
+
+[![][deepwiki-shield]][deepwiki-link]
+[![][twitter-shield]][twitter-link]
+[![][discord-shield]][discord-link]
+[![][telegram-shield]][telegram-link]
+
+</div>
+
+<!-- プロジェクト統計 -->
+
+<div align="center">
+
+[![][github-stars-shield]][github-stars-link]
+[![][github-forks-shield]][github-forks-link]
+[![][github-release-shield]][github-release-link]
+[![][github-contributors-shield]][github-contributors-link]
+
+</div>
+
+<div align="center">
+
+[![][license-shield]][license-link]
+[![][commercial-shield]][commercial-link]
+[![][sponsor-shield]][sponsor-link]
+
+</div>
+
+<div align="center">
+ <a href="https://hellogithub.com/repository/1605492e1e2a4df3be07abfa4578dd37" target="_blank"><img src="https://api.hellogithub.com/v1/widgets/recommend.svg?rid=1605492e1e2a4df3be07abfa4578dd37" alt="Featured｜HelloGitHub" style="width: 200px; height: 43px;" width="200" height="43" /></a>
+ <a href="https://trendshift.io/repositories/11772" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11772" alt="kangfenmao%2Fcherry-studio | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
+ <a href="https://www.producthunt.com/posts/cherry-studio?embed=true&utm_source=badge-featured&utm_medium=badge&utm_souce=badge-cherry&#0045;studio" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/featured.svg?post_id=496640&theme=light" alt="Cherry&#0032;Studio - AI&#0032;Chatbots&#0044;&#0032;AI&#0032;Desktop&#0032;Client | Product Hunt" style="width: 200px; height: 43px;" width="200" height="43" /></a>
+</div>
+
+# 🍒 Cherry Studio
+
+Cherry Studio は、複数の LLM プロバイダーをサポートするデスクトップクライアントで、Windows、Mac、Linux で利用可能です。
+
+👏 [Telegram](https://t.me/CherryStudioAI)｜[Discord](https://discord.gg/wez8HtpxqQ) | [QQグループ(575014769)](https://qm.qq.com/q/lo0D4qVZKi)
+
+❤️ Cherry Studio をお気に入りにしましたか？小さな星をつけてください 🌟 または [スポンサー](sponsor.md) をして開発をサポートしてください！
+
+# 🌠 スクリーンショット
+
+![](https://github.com/user-attachments/assets/36dddb2c-e0fb-4a5f-9411-91447bab6e18)
+
+![](https://github.com/user-attachments/assets/f549e8a0-2385-40b4-b52b-2039e39f2930)
+
+![](https://github.com/user-attachments/assets/58e0237c-4d36-40de-b428-53051d982026)
+
+# 🌟 主な機能
+
+1. **多様な LLM サービス対応**：
+
+- ☁️ 主要な LLM クラウドサービス対応：OpenAI、Gemini、Anthropic など
+- 🔗 AI Web サービス統合：Claude、Peplexity、Poe など
+- 💻 Ollama、LM Studio によるローカルモデル実行対応
+
+2. **AI アシスタントと対話**：
+
+- 📚 300+ の事前設定済み AI アシスタント
+- 🤖 カスタム AI アシスタントの作成
+- 💬 複数モデルでの同時対話機能
+
+3. **文書とデータ処理**：
+
+- 📄 テキスト、画像、Office、PDF など多様な形式対応
+- ☁️ WebDAV によるファイル管理とバックアップ
+- 📊 Mermaid による図表作成
+- 💻 コードハイライト機能
+
+4. **実用的なツール統合**：
+
+- 🔍 グローバル検索機能
+- 📝 トピック管理システム
+- 🔤 AI による翻訳機能
+- 🎯 ドラッグ＆ドロップによる整理
+- 🔌 ミニプログラム対応
+- ⚙️ MCP（モデルコンテキストプロトコル）サービス
+
+5. **優れたユーザー体験**：
+
+- 🖥️ Windows、Mac、Linux のクロスプラットフォーム対応
+- 📦 環境構築不要ですぐに使用可能
+- 🎨 ライト/ダークテーマと透明ウィンドウ対応
+- 📝 完全な Markdown レンダリング
+- 🤲 簡単な共有機能
+
+# 📝 開発計画
+
+以下の機能と改善に積極的に取り組んでいます：
+
+1. 🎯 **コア機能**
+
+- 選択アシスタント - スマートな内容選択の強化
+- ディープリサーチ - 高度な研究能力
+- メモリーシステム - グローバルコンテキスト認識
+- ドキュメント前処理 - 文書処理の改善
+- MCP マーケットプレイス - モデルコンテキストプロトコルエコシステム
+
+2. 🗂 **ナレッジ管理**
+
+- ノートとコレクション
+- ダイナミックキャンバス可視化
+- OCR 機能
+- TTS（テキスト読み上げ）サポート
+
+3. 📱 **プラットフォーム対応**
+
+- HarmonyOS エディション
+- Android アプリ（フェーズ1）
+- iOS アプリ（フェーズ1）
+- マルチウィンドウ対応
+- ウィンドウピン留め機能
+
+4. 🔌 **高度な機能**
+
+- プラグインシステム
+- ASR（音声認識）
+- アシスタントとトピックの対話機能リファクタリング
+
+[プロジェクトボード](https://github.com/orgs/CherryHQ/projects/7)で進捗を確認し、貢献することができます。
+
+開発計画に影響を与えたいですか？[GitHub ディスカッション](https://github.com/CherryHQ/cherry-studio/discussions)に参加して、アイデアやフィードバックを共有してください！
+
+# 🌈 テーマ
+
+- テーマギャラリー：https://cherrycss.com
+- Aero テーマ：https://github.com/hakadao/CherryStudio-Aero
+- PaperMaterial テーマ：https://github.com/rainoffallingstar/CherryStudio-PaperMaterial
+- Claude テーマ：https://github.com/bjl101501/CherryStudio-Claudestyle-dynamic
+- メープルネオンテーマ：https://github.com/BoningtonChen/CherryStudio_themes
+
+より多くのテーマの PR を歓迎します
+
+# 🤝 貢献
+
+Cherry Studio への貢献を歓迎します！以下の方法で貢献できます：
+
+1. **コードの貢献**：新機能を開発するか、既存のコードを最適化します
+2. **バグの修正**：見つけたバグを修正します
+3. **問題の管理**：GitHub の問題を管理するのを手伝います
+4. **製品デザイン**：デザインの議論に参加します
+5. **ドキュメントの作成**：ユーザーマニュアルやガイドを改善します
+6. **コミュニティの参加**：ディスカッションに参加し、ユーザーを支援します
+7. **使用の促進**：Cherry Studio を広めます
+
+[ブランチ戦略](branching-strategy-en.md)を参照して貢献ガイドラインを確認してください
+
+## 始め方
+
+1. **リポジトリをフォーク**：フォークしてローカルマシンにクローンします
+2. **ブランチを作成**：変更のためのブランチを作成します
+3. **変更を提出**：変更をコミットしてプッシュします
+4. **プルリクエストを開く**：変更内容と理由を説明します
+
+詳細なガイドラインについては、[貢献ガイド](../CONTRIBUTING.md)をご覧ください。
+
+ご支援と貢献に感謝します！
+
+# 🔗 関連プロジェクト
+
+- [one-api](https://github.com/songquanpeng/one-api)：LLM API の管理・配信システム。OpenAI、Azure、Anthropic などの主要モデルに対応し、統一 API インターフェースを提供。API キー管理と再配布に利用可能。
+
+- [ublacklist](https://github.com/iorate/ublacklist)：Google 検索結果から特定のサイトを非表示にします
+
+# 🚀 コントリビューター
+
+<a href="https://github.com/CherryHQ/cherry-studio/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=CherryHQ/cherry-studio" />
+</a>
+<br /><br />
+
+# ⭐️ スター履歴
+
+[![Star History Chart](https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Timeline)](https://star-history.com/#CherryHQ/cherry-studio&Timeline)
+
+<!-- リンクと画像 -->
+[deepwiki-shield]: https://img.shields.io/badge/Deepwiki-CherryHQ-0088CC?style=plastic
+[deepwiki-link]: https://deepwiki.com/CherryHQ/cherry-studio
+[twitter-shield]: https://img.shields.io/badge/Twitter-CherryStudioApp-0088CC?style=plastic&logo=x
+[twitter-link]: https://twitter.com/CherryStudioHQ
+[discord-shield]: https://img.shields.io/badge/Discord-@CherryStudio-0088CC?style=plastic&logo=discord
+[discord-link]: https://discord.gg/wez8HtpxqQ
+[telegram-shield]: https://img.shields.io/badge/Telegram-@CherryStudioAI-0088CC?style=plastic&logo=telegram
+[telegram-link]: https://t.me/CherryStudioAI
+
+<!-- プロジェクト統計 -->
+[github-stars-shield]: https://img.shields.io/github/stars/CherryHQ/cherry-studio?style=social
+[github-stars-link]: https://github.com/CherryHQ/cherry-studio/stargazers
+[github-forks-shield]: https://img.shields.io/github/forks/CherryHQ/cherry-studio?style=social
+[github-forks-link]: https://github.com/CherryHQ/cherry-studio/network
+[github-release-shield]: https://img.shields.io/github/v/release/CherryHQ/cherry-studio
+[github-release-link]: https://github.com/CherryHQ/cherry-studio/releases
+[github-contributors-shield]: https://img.shields.io/github/contributors/CherryHQ/cherry-studio
+[github-contributors-link]: https://github.com/CherryHQ/cherry-studio/graphs/contributors
+
+<!-- ライセンスとスポンサー -->
+[license-shield]: https://img.shields.io/badge/License-AGPLv3-important.svg?style=plastic&logo=gnu
+[license-link]: https://www.gnu.org/licenses/agpl-3.0
+[commercial-shield]: https://img.shields.io/badge/商用ライセンス-お問い合わせ-white.svg?style=plastic&logoColor=white&logo=telegram&color=blue
+[commercial-link]: mailto:license@cherry-ai.com?subject=商業ライセンスについて
+[sponsor-shield]: https://img.shields.io/badge/スポンサー-FF6699.svg?style=plastic&logo=githubsponsors&logoColor=white
+[sponsor-link]: https://github.com/CherryHQ/cherry-studio/blob/main/docs/sponsor.md
--- a/docs/README.zh.md
+++ b/docs/README.zh.md
@@ -1,40 +1,10 @@
-<div align="right" >
-  <details>
-    <summary >🌐 Language</summary>
-    <div>
-      <div align="right">
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=en">English</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=zh-CN">简体中文</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=zh-TW">繁體中文</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ja">日本語</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ko">한국어</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=hi">हिन्दी</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=th">ไทย</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=fr">Français</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=de">Deutsch</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=es">Español</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=it">Itapano</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ru">Русский</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=pt">Português</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=nl">Nederlands</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=pl">Polski</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=ar">العربية</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=fa">فارسی</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=tr">Türkçe</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=vi">Tiếng Việt</a></p>
-        <p><a href="https://openaitx.github.io/view.html?user=CherryHQ&project=cherry-studio&lang=id">Bahasa Indonesia</a></p>
-      </div>
-    </div>
-  </details>
-</div>
-
 <h1 align="center">
  <a href="https://github.com/CherryHQ/cherry-studio/releases">
    <img src="https://github.com/CherryHQ/cherry-studio/blob/main/build/icon.png?raw=true" width="150" height="150" alt="banner" /><br>
  </a>
 </h1>
 <p align="center">
-  <a href="https://github.com/CherryHQ/cherry-studio">English</a> | 中文 | <a href="https://cherry-ai.com">官方网站</a> | <a href="https://docs.cherry-ai.com/cherry-studio-wen-dang/zh-cn">文档</a> | <a href="./dev.md">开发</a> | <a href="https://github.com/CherryHQ/cherry-studio/issues">反馈</a><br>
+  <a href="https://github.com/CherryHQ/cherry-studio">English</a> | 中文 | <a href="./README.ja.md">日本語</a> | <a href="https://cherry-ai.com">官方网站</a> | <a href="https://docs.cherry-ai.com/cherry-studio-wen-dang/zh-cn">文档</a> | <a href="./dev.md">开发</a> | <a href="https://github.com/CherryHQ/cherry-studio/issues">反馈</a><br>
 </p>

 <!-- 题头徽章组合 -->
@@ -48,10 +18,19 @@

 </div>

+<!-- 项目统计徽章 -->
+
 <div align="center">

+[![][github-stars-shield]][github-stars-link]
+[![][github-forks-shield]][github-forks-link]
 [![][github-release-shield]][github-release-link]
 [![][github-contributors-shield]][github-contributors-link]
+
+</div>
+
+<div align="center">
+
 [![][license-shield]][license-link]
 [![][commercial-shield]][commercial-link]
 [![][sponsor-shield]][sponsor-link]
@@ -59,9 +38,9 @@
 </div>

 <div align="center">
- <a href="https://hellogithub.com/repository/1605492e1e2a4df3be07abfa4578dd37" target="_blank" style="text-decoration: none"><img src="https://api.hellogithub.com/v1/widgets/recommend.svg?rid=1605492e1e2a4df3be07abfa4578dd37" alt="Featured｜HelloGitHub"  width="220" height="55" /></a>
- <a href="https://trendshift.io/repositories/11772" target="_blank" style="text-decoration: none"><img src="https://trendshift.io/api/badge/repositories/11772" alt="kangfenmao%2Fcherry-studio | Trendshift" width="220" height="55" /></a>
- <a href="https://www.producthunt.com/posts/cherry-studio?embed=true&utm_source=badge-featured&utm_medium=badge&utm_souce=badge-cherry&#0045;studio" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/featured.svg?post_id=496640&theme=light" alt="Cherry&#0032;Studio - AI&#0032;Chatbots&#0044;&#0032;AI&#0032;Desktop&#0032;Client | Product Hunt" width="220" height="55" /></a>
+ <a href="https://hellogithub.com/repository/1605492e1e2a4df3be07abfa4578dd37" target="_blank"><img src="https://api.hellogithub.com/v1/widgets/recommend.svg?rid=1605492e1e2a4df3be07abfa4578dd37" alt="Featured｜HelloGitHub" style="width: 200px; height: 43px;" width="200" height="43" /></a>
+ <a href="https://trendshift.io/repositories/11772" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11772" alt="kangfenmao%2Fcherry-studio | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
+ <a href="https://www.producthunt.com/posts/cherry-studio?embed=true&utm_source=badge-featured&utm_medium=badge&utm_souce=badge-cherry&#0045;studio" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/featured.svg?post_id=496640&theme=light" alt="Cherry&#0032;Studio - AI&#0032;Chatbots&#0044;&#0032;AI&#0032;Desktop&#0032;Client | Product Hunt" style="width: 200px; height: 43px;" width="200" height="43" /></a>
 </div>

 # 🍒 Cherry Studio
@@ -72,6 +51,14 @@ Cherry Studio 是一款支持多个大语言模型（LLM）服务商的桌面客

 ❤️ 喜欢 Cherry Studio? 点亮小星星 🌟 或 [赞助开发者](sponsor.md)! ❤️

+# GitCode✖️Cherry Studio【新源力】贡献挑战赛
+
+<p align="center">
+  <a href="https://gitcode.com/CherryHQ/cherry-studio/discussion/2">
+    <img src="https://raw.gitcode.com/user-images/assets/5007375/8d8d7559-1141-4691-b90f-d154558c6896/cherry-studio-gitcode.jpg" width="100%" alt="banner" />
+  </a>
+</p>
+
 # 📖 使用教程

 https://docs.cherry-ai.com
@@ -190,82 +177,10 @@ https://docs.cherry-ai.com
 3. **提交更改**：提交并推送您的更改
 4. **打开 Pull Request**：描述您的更改和原因

-有关更详细的指南，请参阅我们的 [贡献指南](CONTRIBUTING.zh.md)
+有关更详细的指南，请参阅我们的 [贡献指南](./CONTRIBUTING.zh.md)

 感谢您的支持和贡献！

-# 🔧 开发者共创计划
-
-我们正在启动 Cherry Studio 开发者共创计划，旨在为开源生态系统构建一个健康、正向反馈的循环。我们相信，优秀的软件是通过协作构建的，每一个合并的拉取请求都为项目注入新的生命力。
-
-我们诚挚地邀请您加入我们的贡献者队伍，与我们一起塑造 Cherry Studio 的未来。
-
-## 贡献者奖励计划
-
-为了回馈我们的核心贡献者并创造良性循环，我们建立了以下长期激励计划。
-
-**该计划的首个跟踪周期将是 2025 年第三季度（7月、8月、9月）。此周期的奖励将在 10月1日 发放。**
-
-在任何跟踪周期内（例如，首个周期的 7月1日 至 9月30日），任何为 Cherry Studio 在 GitHub 上的开源项目贡献超过 **30 个有意义提交** 的开发者都有资格获得以下福利：
-
- **Cursor 订阅赞助**：获得 **70 美元** 的 [Cursor](https://cursor.sh/) 订阅积分或报销，让 AI 成为您最高效的编码伙伴。
- **无限模型访问**：获得 **DeepSeek** 和 **Qwen** 模型的 **无限次** API 调用。
- **前沿技术访问**：享受偶尔的特殊福利，包括 **Claude**、**Gemini** 和 **OpenAI** 等模型的 API 访问权限，让您始终站在技术前沿。
-
-## 共同成长与未来规划
-
-活跃的社区是任何可持续开源项目背后的推动力。随着 Cherry Studio 的发展，我们的奖励计划也将随之发展。我们致力于持续将我们的福利与行业内最优秀的工具和资源保持一致。这确保我们的核心贡献者获得有意义的支持，创造一个开发者、社区和项目共同成长的正向循环。
-
-**展望未来，该项目还将采取越来越开放的态度来回馈整个开源社区。**
-
-## 如何开始？
-
-我们期待您的第一个拉取请求！
-
-您可以从探索我们的仓库开始，选择一个 `good first issue`，或者提出您自己的改进建议。每一个提交都是开源精神的体现。
-
-感谢您的关注和贡献。
-
-让我们一起建设。
-
-# 🏢 企业版
-
-在社区版的基础上，我们自豪地推出 **Cherry Studio 企业版**——一个为现代团队和企业设计的私有部署 AI 生产力与管理平台。
-
-企业版通过集中管理 AI 资源、知识和数据，解决了团队协作中的核心挑战。它赋能组织提升效率、促进创新并确保合规，同时在安全环境中保持对数据的 100% 控制。
-
-## 核心优势
-
- **统一模型管理**：集中整合和管理各种基于云的大语言模型（如 OpenAI、Anthropic、Google Gemini）和本地部署的私有模型。员工可以开箱即用，无需单独配置。
- **企业级知识库**：构建、管理和分享全团队的知识库。确保知识得到保留且一致，使团队成员能够基于统一准确的信息与 AI 交互。
- **细粒度访问控制**：通过统一的管理后台轻松管理员工账户，并为不同模型、知识库和功能分配基于角色的权限。
- **完全私有部署**：在您的本地服务器或私有云上部署整个后端服务，确保您的数据 100% 私有且在您的控制之下，满足最严格的安全和合规标准。
- **可靠的后端服务**：提供稳定的 API 服务、企业级数据备份和恢复机制，确保业务连续性。
-
-## ✨ 在线演示
-
-> 🚧 **公开测试版通知**
->
-> 企业版目前处于早期公开测试阶段，我们正在积极迭代和优化其功能。我们知道它可能还不够完全稳定。如果您在试用过程中遇到任何问题或有宝贵建议，我们非常感谢您能通过邮件联系我们提供反馈。
-
-**🔗 [Cherry Studio 企业版](https://www.cherry-ai.com/enterprise)**
-
-## 版本对比
-
-| 功能         | 社区版                  | 企业版                                                                                         |
-| :----------- | :---------------------- | :--------------------------------------------------------------------------------------------- |
-| **开源**     | ✅ 是                   | ⭕️ 部分开源，对客户开放                                                                        |
-| **成本**     | 个人使用免费 / 商业授权 | 买断 / 订阅费用                                                                                |
-| **管理后台** | —                       | ● 集中化**模型**访问<br>● **员工**管理<br>● 共享**知识库**<br>● **访问**控制<br>● **数据**备份 |
-| **服务器**   | —                       | ✅ 专用私有部署                                                                                |
-
-## 获取企业版
-
-我们相信企业版将成为您团队的 AI 生产力引擎。如果您对 Cherry Studio 企业版感兴趣，希望了解更多信息、请求报价或安排演示，请联系我们。
-
- **商业咨询与购买**：
-  **📧 [bd@cherry-ai.com](mailto:bd@cherry-ai.com)**
-
 # 🔗 相关项目

 - [one-api](https://github.com/songquanpeng/one-api)：LLM API 管理及分发系统，支持 OpenAI、Azure、Anthropic 等主流模型，统一 API 接口，可用于密钥管理与二次分发。
@@ -279,43 +194,34 @@ https://docs.cherry-ai.com
 </a>
 <br /><br />

-# 📊 GitHub 统计
-
-![Stats](https://repobeats.axiom.co/api/embed/a693f2e5f773eed620f70031e974552156c7f397.svg 'Repobeats analytics image')
-
 # ⭐️ Star 记录

-<a href="https://www.star-history.com/#CherryHQ/cherry-studio&Date">
- <picture>
-   <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date&theme=dark" />
-   <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date" />
-   <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Date" />
- </picture>
-</a>
+[![Star History Chart](https://api.star-history.com/svg?repos=CherryHQ/cherry-studio&type=Timeline)](https://star-history.com/#CherryHQ/cherry-studio&Timeline)

 <!-- Links & Images -->
-
-[deepwiki-shield]: https://img.shields.io/badge/Deepwiki-CherryHQ-0088CC
+[deepwiki-shield]: https://img.shields.io/badge/Deepwiki-CherryHQ-0088CC?style=plastic
 [deepwiki-link]: https://deepwiki.com/CherryHQ/cherry-studio
-[twitter-shield]: https://img.shields.io/badge/Twitter-CherryStudioApp-0088CC?logo=x
+[twitter-shield]: https://img.shields.io/badge/Twitter-CherryStudioApp-0088CC?style=plastic&logo=x
 [twitter-link]: https://twitter.com/CherryStudioHQ
-[discord-shield]: https://img.shields.io/badge/Discord-@CherryStudio-0088CC?logo=discord
+[discord-shield]: https://img.shields.io/badge/Discord-@CherryStudio-0088CC?style=plastic&logo=discord
 [discord-link]: https://discord.gg/wez8HtpxqQ
-[telegram-shield]: https://img.shields.io/badge/Telegram-@CherryStudioAI-0088CC?logo=telegram
+[telegram-shield]: https://img.shields.io/badge/Telegram-@CherryStudioAI-0088CC?style=plastic&logo=telegram
 [telegram-link]: https://t.me/CherryStudioAI

 <!-- 项目统计徽章 -->
-
+[github-stars-shield]: https://img.shields.io/github/stars/CherryHQ/cherry-studio?style=social
+[github-stars-link]: https://github.com/CherryHQ/cherry-studio/stargazers
+[github-forks-shield]: https://img.shields.io/github/forks/CherryHQ/cherry-studio?style=social
+[github-forks-link]: https://github.com/CherryHQ/cherry-studio/network
 [github-release-shield]: https://img.shields.io/github/v/release/CherryHQ/cherry-studio
 [github-release-link]: https://github.com/CherryHQ/cherry-studio/releases
 [github-contributors-shield]: https://img.shields.io/github/contributors/CherryHQ/cherry-studio
 [github-contributors-link]: https://github.com/CherryHQ/cherry-studio/graphs/contributors

 <!-- 许可和赞助徽章 -->
-
-[license-shield]: https://img.shields.io/badge/License-AGPLv3-important.svg?logo=gnu
+[license-shield]: https://img.shields.io/badge/License-AGPLv3-important.svg?style=plastic&logo=gnu
 [license-link]: https://www.gnu.org/licenses/agpl-3.0
-[commercial-shield]: https://img.shields.io/badge/商用授权-联系-white.svg?logoColor=white&logo=telegram&color=blue
+[commercial-shield]: https://img.shields.io/badge/商用授权-联系-white.svg?style=plastic&logoColor=white&logo=telegram&color=blue
 [commercial-link]: mailto:license@cherry-ai.com?subject=商业授权咨询
-[sponsor-shield]: https://img.shields.io/badge/赞助支持-FF6699.svg?logo=githubsponsors&logoColor=white
+[sponsor-shield]: https://img.shields.io/badge/赞助支持-FF6699.svg?style=plastic&logo=githubsponsors&logoColor=white
 [sponsor-link]: https://github.com/CherryHQ/cherry-studio/blob/main/docs/sponsor.md
--- a/docs/branching-strategy-en.md
+++ b/docs/branching-strategy-en.md
@@ -16,8 +16,6 @@ Cherry Studio implements a structured branching strategy to maintain code qualit
  - Only accepts documentation updates and bug fixes
  - Thoroughly tested before production deployment

-For details about the `testplan` branch used in the Test Plan, please refer to the [Test Plan](testplan-en.md).
-
 ## Contributing Branches

 When contributing to Cherry Studio, please follow these guidelines:
--- a/docs/branching-strategy-zh.md
+++ b/docs/branching-strategy-zh.md
@@ -16,8 +16,6 @@ Cherry Studio 采用结构化的分支策略来维护代码质量并简化开发
  - 只接受文档更新和 bug 修复
  - 经过完整测试后可以发布到生产环境

-关于测试计划所使用的`testplan`分支，请查阅[测试计划](testplan-zh.md)。
-
 ## 贡献分支

 在为 Cherry Studio 贡献代码时，请遵循以下准则：
--- a/docs/technical/how-to-write-middlewares.md
+++ b/docs/technical/how-to-write-middlewares.md
@@ -1,214 +0,0 @@
-# 如何为 AI Provider 编写中间件
-
-本文档旨在指导开发者如何为我们的 AI Provider 框架创建和集成自定义中间件。中间件提供了一种强大而灵活的方式来增强、修改或观察 Provider 方法的调用过程，例如日志记录、缓存、请求/响应转换、错误处理等。
-
-## 架构概览
-
-我们的中间件架构借鉴了 Redux 的三段式设计，并结合了 JavaScript Proxy 来动态地将中间件应用于 Provider 的方法。
-
- **Proxy**: 拦截对 Provider 方法的调用，并将调用引导至中间件链。
- **中间件链**: 一系列按顺序执行的中间件函数。每个中间件都可以处理请求/响应，然后将控制权传递给链中的下一个中间件，或者在某些情况下提前终止链。
- **上下文 (Context)**: 一个在中间件之间传递的对象，携带了关于当前调用的信息（如方法名、原始参数、Provider 实例、以及中间件自定义的数据）。
-
-## 中间件的类型
-
-目前主要支持两种类型的中间件，它们共享相似的结构但针对不同的场景：
-
-1.  **`CompletionsMiddleware`**: 专门为 `completions` 方法设计。这是最常用的中间件类型，因为它允许对 AI 模型的核心聊天/文本生成功能进行精细控制。
-2.  **`ProviderMethodMiddleware`**: 通用中间件，可以应用于 Provider 上的任何其他方法（例如，`translate`, `summarize` 等，如果这些方法也通过中间件系统包装）。
-
-## 编写一个 `CompletionsMiddleware`
-
-`CompletionsMiddleware` 的基本签名（TypeScript 类型）如下：
-
-```typescript
-import { AiProviderMiddlewareCompletionsContext, CompletionsParams, MiddlewareAPI } from './AiProviderMiddlewareTypes' // 假设类型定义文件路径
-
-export type CompletionsMiddleware = (
-  api: MiddlewareAPI<AiProviderMiddlewareCompletionsContext, [CompletionsParams]>
-) => (
-  next: (context: AiProviderMiddlewareCompletionsContext, params: CompletionsParams) => Promise<any> // next 返回 Promise<any> 代表原始SDK响应或下游中间件的结果
-) => (context: AiProviderMiddlewareCompletionsContext, params: CompletionsParams) => Promise<void> // 最内层函数通常返回 Promise<void>，因为结果通过 onChunk 或 context 副作用传递
-```
-
-让我们分解这个三段式结构：
-
-1.  **第一层函数 `(api) => { ... }`**:
-
-    - 接收一个 `api` 对象。
-    - `api` 对象提供了以下方法：
-      - `api.getContext()`: 获取当前调用的上下文对象 (`AiProviderMiddlewareCompletionsContext`)。
-      - `api.getOriginalArgs()`: 获取传递给 `completions` 方法的原始参数数组 (即 `[CompletionsParams]`)。
-      - `api.getProviderId()`: 获取当前 Provider 的 ID。
-      - `api.getProviderInstance()`: 获取原始的 Provider 实例。
-    - 此函数通常用于进行一次性的设置或获取所需的服务/配置。它返回第二层函数。
-
-2.  **第二层函数 `(next) => { ... }`**:
-
-    - 接收一个 `next` 函数。
-    - `next` 函数代表了中间件链中的下一个环节。调用 `next(context, params)` 会将控制权传递给下一个中间件，或者如果当前中间件是链中的最后一个，则会调用核心的 Provider 方法逻辑 (例如，实际的 SDK 调用)。
-    - `next` 函数接收当前的 `context` 和 `params` (这些可能已被上游中间件修改)。
-    - **重要的是**：`next` 的返回类型通常是 `Promise<any>`。对于 `completions` 方法，如果 `next` 调用了实际的 SDK，它将返回原始的 SDK 响应（例如，OpenAI 的流对象或 JSON 对象）。你需要处理这个响应。
-    - 此函数返回第三层（也是最核心的）函数。
-
-3.  **第三层函数 `(context, params) => { ... }`**:
-    - 这是执行中间件主要逻辑的地方。
-    - 它接收当前的 `context` (`AiProviderMiddlewareCompletionsContext`) 和 `params` (`CompletionsParams`)。
-    - 在此函数中，你可以：
-      - **在调用 `next` 之前**:
-        - 读取或修改 `params`。例如，添加默认参数、转换消息格式。
-        - 读取或修改 `context`。例如，设置一个时间戳用于后续计算延迟。
-        - 执行某些检查，如果不满足条件，可以不调用 `next` 而直接返回或抛出错误（例如，参数校验失败）。
-      - **调用 `await next(context, params)`**:
-        - 这是将控制权传递给下游的关键步骤。
-        - `next` 的返回值是原始的 SDK 响应或下游中间件的结果，你需要根据情况处理它（例如，如果是流，则开始消费流）。
-      - **在调用 `next` 之后**:
-        - 处理 `next` 的返回结果。例如，如果 `next` 返回了一个流，你可以在这里开始迭代处理这个流，并通过 `context.onChunk` 发送数据块。
-        - 基于 `context` 的变化或 `next` 的结果执行进一步操作。例如，计算总耗时、记录日志。
-        - 修改最终结果（尽管对于 `completions`，结果通常通过 `onChunk` 副作用发出）。
-
-### 示例：一个简单的日志中间件
-
-```typescript
-import {
-  AiProviderMiddlewareCompletionsContext,
-  CompletionsParams,
-  MiddlewareAPI,
-  OnChunkFunction // 假设 OnChunkFunction 类型被导出
-} from './AiProviderMiddlewareTypes' // 调整路径
-import { ChunkType } from '@renderer/types' // 调整路径
-
-export const createSimpleLoggingMiddleware = (): CompletionsMiddleware => {
-  return (api: MiddlewareAPI<AiProviderMiddlewareCompletionsContext, [CompletionsParams]>) => {
-    // console.log(`[LoggingMiddleware] Initialized for provider: ${api.getProviderId()}`);
-
-    return (next: (context: AiProviderMiddlewareCompletionsContext, params: CompletionsParams) => Promise<any>) => {
-      return async (context: AiProviderMiddlewareCompletionsContext, params: CompletionsParams): Promise<void> => {
-        const startTime = Date.now()
-        // 从 context 中获取 onChunk (它最初来自 params.onChunk)
-        const onChunk = context.onChunk
-
-        console.log(
-          `[LoggingMiddleware] Request for ${context.methodName} with params:`,
-          params.messages?.[params.messages.length - 1]?.content
-        )
-
-        try {
-          // 调用下一个中间件或核心逻辑
-          // `rawSdkResponse` 是来自下游的原始响应 (例如 OpenAIStream 或 ChatCompletion 对象)
-          const rawSdkResponse = await next(context, params)
-
-          // 此处简单示例不处理 rawSdkResponse，假设下游中间件 (如 StreamingResponseHandler)
-          // 会处理它并通过 onChunk 发送数据。
-          // 如果这个日志中间件在 StreamingResponseHandler 之后，那么流已经被处理。
-          // 如果在之前，那么它需要自己处理 rawSdkResponse 或确保下游会处理。
-
-          const duration = Date.now() - startTime
-          console.log(`[LoggingMiddleware] Request for ${context.methodName} completed in ${duration}ms.`)
-
-          // 假设下游已经通过 onChunk 发送了所有数据。
-          // 如果这个中间件是链的末端，并且需要确保 BLOCK_COMPLETE 被发送，
-          // 它可能需要更复杂的逻辑来跟踪何时所有数据都已发送。
-        } catch (error) {
-          const duration = Date.now() - startTime
-          console.error(`[LoggingMiddleware] Request for ${context.methodName} failed after ${duration}ms:`, error)
-
-          // 如果 onChunk 可用，可以尝试发送一个错误块
-          if (onChunk) {
-            onChunk({
-              type: ChunkType.ERROR,
-              error: { message: (error as Error).message, name: (error as Error).name, stack: (error as Error).stack }
-            })
-            // 考虑是否还需要发送 BLOCK_COMPLETE 来结束流
-            onChunk({ type: ChunkType.BLOCK_COMPLETE, response: {} })
-          }
-          throw error // 重新抛出错误，以便上层或全局错误处理器可以捕获
-        }
-      }
-    }
-  }
-}
-```
-
-### `AiProviderMiddlewareCompletionsContext` 的重要性
-
-`AiProviderMiddlewareCompletionsContext` 是在中间件之间传递状态和数据的核心。它通常包含：
-
- `methodName`: 当前调用的方法名 (总是 `'completions'`)。
- `originalArgs`: 传递给 `completions` 的原始参数数组。
- `providerId`: Provider 的 ID。
- `_providerInstance`: Provider 实例。
- `onChunk`: 从原始 `CompletionsParams` 传入的回调函数，用于流式发送数据块。**所有中间件都应该通过 `context.onChunk` 来发送数据。**
- `messages`, `model`, `assistant`, `mcpTools`: 从原始 `CompletionsParams` 中提取的常用字段，方便访问。
- **自定义字段**: 中间件可以向上下文中添加自定义字段，以供后续中间件使用。例如，一个缓存中间件可能会添加 `context.cacheHit = true`。
-
-**关键**: 当你在中间件中修改 `params` 或 `context` 时，这些修改会向下游中间件传播（如果它们在 `next` 调用之前修改）。
-
-### 中间件的顺序
-
-中间件的执行顺序非常重要。它们在 `AiProviderMiddlewareConfig` 的数组中定义的顺序就是它们的执行顺序。
-
- 请求首先通过第一个中间件，然后是第二个，依此类推。
- 响应（或 `next` 的调用结果）则以相反的顺序"冒泡"回来。
-
-例如，如果链是 `[AuthMiddleware, CacheMiddleware, LoggingMiddleware]`：
-
-1.  `AuthMiddleware` 先执行其 "调用 `next` 之前" 的逻辑。
-2.  然后 `CacheMiddleware` 执行其 "调用 `next` 之前" 的逻辑。
-3.  然后 `LoggingMiddleware` 执行其 "调用 `next` 之前" 的逻辑。
-4.  核心SDK调用（或链的末端）。
-5.  `LoggingMiddleware` 先接收到结果，执行其 "调用 `next` 之后" 的逻辑。
-6.  然后 `CacheMiddleware` 接收到结果（可能已被 LoggingMiddleware 修改的上下文），执行其 "调用 `next` 之后" 的逻辑（例如，存储结果）。
-7.  最后 `AuthMiddleware` 接收到结果，执行其 "调用 `next` 之后" 的逻辑。
-
-### 注册中间件
-
-中间件在 `src/renderer/src/providers/middleware/register.ts` (或其他类似的配置文件) 中进行注册。
-
-```typescript
-// register.ts
-import { AiProviderMiddlewareConfig } from './AiProviderMiddlewareTypes'
-import { createSimpleLoggingMiddleware } from './common/SimpleLoggingMiddleware' // 假设你创建了这个文件
-import { createCompletionsLoggingMiddleware } from './common/CompletionsLoggingMiddleware' // 已有的
-
-const middlewareConfig: AiProviderMiddlewareConfig = {
-  completions: [
-    createSimpleLoggingMiddleware(), // 你新加的中间件
-    createCompletionsLoggingMiddleware() // 已有的日志中间件
-    // ... 其他 completions 中间件
-  ],
-  methods: {
-    // translate: [createGenericLoggingMiddleware()],
-    // ... 其他方法的中间件
-  }
-}
-
-export default middlewareConfig
-```
-
-### 最佳实践
-
-1.  **单一职责**: 每个中间件应专注于一个特定的功能（例如，日志、缓存、转换特定数据）。
-2.  **无副作用 (尽可能)**: 除了通过 `context` 或 `onChunk` 明确的副作用外，尽量避免修改全局状态或产生其他隐蔽的副作用。
-3.  **错误处理**:
-    - 在中间件内部使用 `try...catch` 来处理可能发生的错误。
-    - 决定是自行处理错误（例如，通过 `onChunk` 发送错误块）还是将错误重新抛出给上游。
-    - 如果重新抛出，确保错误对象包含足够的信息。
-4.  **性能考虑**: 中间件会增加请求处理的开销。避免在中间件中执行非常耗时的同步操作。对于IO密集型操作，确保它们是异步的。
-5.  **可配置性**: 使中间件的行为可通过参数或配置进行调整。例如，日志中间件可以接受一个日志级别参数。
-6.  **上下文管理**:
-    - 谨慎地向 `context` 添加数据。避免污染 `context` 或添加过大的对象。
-    - 明确你添加到 `context` 的字段的用途和生命周期。
-7.  **`next` 的调用**:
-    - 除非你有充分的理由提前终止请求（例如，缓存命中、授权失败），否则**总是确保调用 `await next(context, params)`**。否则，下游的中间件和核心逻辑将不会执行。
-    - 理解 `next` 的返回值并正确处理它，特别是当它是一个流时。你需要负责消费这个流或将其传递给另一个能够消费它的组件/中间件。
-8.  **命名清晰**: 给你的中间件和它们创建的函数起描述性的名字。
-9.  **文档和注释**: 对复杂的中间件逻辑添加注释，解释其工作原理和目的。
-
-### 调试技巧
-
- 在中间件的关键点使用 `console.log` 或调试器来检查 `params`、`context` 的状态以及 `next` 的返回值。
- 暂时简化中间件链，只保留你正在调试的中间件和最简单的核心逻辑，以隔离问题。
- 编写单元测试来独立验证每个中间件的行为。
-
-通过遵循这些指南，你应该能够有效地为我们的系统创建强大且可维护的中间件。如果你有任何疑问或需要进一步的帮助，请咨询团队。
--- a/docs/technical/topic-message-tree.md
+++ b/docs/technical/topic-message-tree.md
@@ -0,0 +1,635 @@
+# 消息历史版本管理系统设计技术报告（最终版 - 含多模型支持）
+
+## 1. 系统概述
+
+基于现有扁平化架构的最小化扩展，通过 **Topic快照 + Message字段扩展（含siblingIds）** 实现版本管理、分支对话和多模型并行回复功能。
+
+### 1.1 核心设计理念
+
+- **最小破坏性**：只扩展现有实体，不新增表
+- **快照渲染**：通过Topic简单快照管理主线渲染顺序
+- **关系扩展**：通过Message字段实现树状分支、双向链表版本、多模型兄弟关系
+
+## 2. 数据结构设计
+
+### 2.1 实体定义
+
+```typescript
+interface Topic {
+  // === 现有字段保持不变 ===
+  id: string
+  name: string
+  createdAt: string
+  updatedAt: string
+
+  // === 保持简单快照 ===
+  activeMessageIds: string[] // 当前活跃对话主线的消息ID顺序
+}
+
+interface Message {
+  // === 现有字段保持不变 ===
+  id: string
+  role: 'user' | 'assistant' | 'system'
+  topicId: string
+  blocks: MessageBlock['id'][]
+
+  // === 新增：关系字段 ===
+  askId?: string // 问答关系：assistant指向对应的user消息
+  parentMessageId?: string // 分支关系：指向回复的目标消息
+  version?: number // 版本号（assistant消息专用）
+  prevVersionId?: string // 版本链表：前一版本
+  nextVersionId?: string // 版本链表：后一版本
+  groupRequestId?: string // 请求分组：同次API请求的标识
+  siblingIds?: string[] // 兄弟关系：同级多模型回复的ID列表
+}
+
+interface MessageBlock {
+  // === 完全不变 ===
+  id: string
+  messageId: string
+  type: MessageBlockType
+  content: string
+  // ...其他现有字段
+}
+```
+
+### 2.2 数据关系图
+
+```mermaid
+graph TB
+    subgraph "Topic快照层 (主线)"
+        T[Topic.activeMessageIds: user1→asst1-gpt→user2]
+    end
+
+    subgraph "消息实体层"
+        U1[User Message 1<br/>id: user1]
+        A1G["GPT-4 回复<br/>id: asst1-gpt, askId: user1<br/>siblingIds: [asst1-claude]"]
+        A1C["Claude 回复<br/>id: asst1-claude, askId: user1<br/>siblingIds: [asst1-gpt]"]
+        U2["User Message 2<br/>id: user2, parentMessageId: asst1-gpt"]
+    end
+
+    subgraph "版本链表层 (隐藏)"
+        A1GV0[GPT-4 v0<br/>askId: user1, version: 0]
+        A1GV1[GPT-4 v1<br/>askId: user1, version: 1]
+
+        A1GV0 -.->|nextVersionId| A1GV1
+        A1GV1 -.->|prevVersionId| A1GV0
+    end
+
+    subgraph "分支树层 (隐藏)"
+        U1B[User Branch 1<br/>parentMessageId: asst1-gpt]
+        A1B[Assistant Branch 1<br/>askId: user1b]
+    end
+
+    T --> U1
+    T --> A1G
+    T --> U2
+
+    A1G -.->|askId| U1
+    A1C -.->|askId| U1
+    A1G -.->|siblingIds| A1C
+    A1C -.->|siblingIds| A1G
+    U2 -.->|parentMessageId| A1G
+
+    U1B -.->|parentMessageId| A1G
+    A1B -.->|askId| U1B
+```
+
+## 3. 核心操作流程
+
+### 3.1 发送新消息（多模型）
+
+```mermaid
+sequenceDiagram
+    participant UI
+    participant Redux
+    participant DB
+    participant API
+
+    UI->>Redux: sendMessage(userContent, models[])
+
+    Note over Redux: 1. 创建用户消息
+    Redux->>Redux: userMessage = { id: uuid(), role: 'user', ... }
+
+    Note over Redux: 2. 创建助手消息（多模型）
+    Redux->>Redux: groupRequestId = uuid()
+    Redux->>Redux: assistantMessages = models.map(m => createAssistant(userMessage.id, m))
+
+    Note over Redux: 3. 设置兄弟关系
+    Redux->>Redux: assistantIds = assistantMessages.map(m => m.id)
+    loop 每个助手消息
+        Redux->>Redux: msg.siblingIds = assistantIds.filter(id => id !== msg.id)
+    end
+
+    Note over Redux: 4. 更新Topic快照
+    Redux->>Redux: newActiveMessageIds = [<br/>...oldIds,<br/>userMessage.id,<br/>assistantMessages[0].id<br/>]
+
+    Note over Redux: 5. 原子保存
+    Redux->>DB: transaction([messages, topics])
+    DB->>DB: messages.bulkPut([userMessage, ...assistantMessages])
+    DB->>DB: topics.update(topicId, { activeMessageIds })
+
+    Note over Redux: 6. 发送API请求
+    loop 每个模型
+        Redux->>API: generateResponse(model, userContent)
+    end
+
+    Redux->>UI: 更新状态
+```
+
+**复杂度**：O(M) where M = 模型数量
+
+### 3.2 重发消息（版本管理）
+
+```mermaid
+sequenceDiagram
+    participant UI
+    participant Redux
+    participant DB
+
+    UI->>Redux: resendMessage(userMessageId)
+
+    Note over Redux: 1. 查找现有版本
+    Redux->>DB: messages.where('askId').equals(userMessageId)
+    DB-->>Redux: existingVersions[]
+
+    Note over Redux: 2. 计算新版本号
+    Redux->>Redux: latestVersion = max(versions.map(v => v.version))
+    Redux->>Redux: newVersion = latestVersion + 1
+
+    Note over Redux: 3. 创建新版本消息（可能多模型）
+    Redux->>Redux: newGroupRequestId = uuid()
+    Redux->>Redux: newVersionMessages = models.map(m => createNewVersion(prevMsg, newVersion, newGroupRequestId))
+
+    Note over Redux: 4. 设置新版本的兄弟关系
+    Redux->>Redux: newVersionIds = newVersionMessages.map(m => m.id)
+    loop 每个新版本消息
+        Redux->>Redux: msg.siblingIds = newVersionIds.filter(id => id !== msg.id)
+    end
+
+    Note over Redux: 5. 更新版本链表
+    Redux->>DB: transaction(messages)
+    DB->>DB: messages.update(prevMessage.id, { nextVersionId })
+    DB->>DB: messages.bulkPut(newVersionMessages)
+
+    Redux->>UI: 更新状态
+```
+
+**复杂度**：O(V) 查找 + O(M) 创建
+
+### 3.3 切换活跃模型（UI交互）
+
+```mermaid
+flowchart TD
+    A[用户在UI上选择其他模型] --> B[获取当前快照]
+    B --> C[找到当前助手消息在快照中的位置]
+    C --> D[用新选择的模型消息ID替换快照中的ID]
+    D --> E[保存到数据库]
+    E --> F[Redux自动重新渲染]
+
+    style A fill:#e1f5fe
+    style F fill:#c8e6c9
+```
+
+```typescript
+const switchActiveModel = async (topicId: string, messageIndex: number, newModelMessageId: string) => {
+  const topic = await db.topics.get(topicId)
+  const newActiveMessageIds = [...topic.activeMessageIds]
+  newActiveMessageIds[messageIndex] = newModelMessageId
+
+  await db.topics.update(topicId, { activeMessageIds: newActiveMessageIds })
+}
+```
+
+**复杂度**：O(1)
+
+## 4. 字段作用详解
+
+### 4.1 关键字段关系图
+
+```mermaid
+graph LR
+    subgraph "问答关系"
+        askId[askId<br/>assistant → user<br/>逻辑关系，永久不变]
+    end
+
+    subgraph "分支关系"
+        parentId[parentMessageId<br/>message → message<br/>分支对话，树状结构]
+    end
+
+    subgraph "版本关系"
+        version[version + prevVersionId + nextVersionId<br/>同askId下的版本链表]
+    end
+
+    subgraph "请求分组"
+        groupId[groupRequestId<br/>同次API请求标识<br/>一次性，每次重发都变]
+    end
+
+    subgraph "兄弟关系"
+        siblingId[siblingIds<br/>同级多模型回复<br/>双向引用]
+    end
+
+    askId -.-> version
+    askId -.-> siblingId
+    parentId -.-> askId
+    groupId -.-> askId
+```
+
+### 4.2 字段使用场景
+
+| 字段                             | 用途       | 查询场景                   | 生命周期 |
+| -------------------------------- | ---------- | -------------------------- | -------- |
+| **askId**                        | 问答映射   | 查找用户问题的所有回复版本 | 永久不变 |
+| **parentMessageId**              | 分支对话   | 查找某消息的回复分支       | 永久不变 |
+| **version + prev/nextVersionId** | 版本管理   | 版本历史导航               | 永久不变 |
+| **groupRequestId**               | 请求追踪   | 批量状态更新、请求监控     | 一次性   |
+| **siblingIds**                   | 多模型并行 | 渲染同级多模型回复         | 永久不变 |
+
+### 4.3 多模型并行渲染示例
+
+```mermaid
+graph TD
+    U1[User: 帮我写个函数<br/>id: user1]
+
+    subgraph "第一次请求 (groupRequestId: req1)"
+        A1["GPT-4 回复<br/>id: asst1-gpt, askId: user1<br/>siblingIds: [asst1-claude]"]
+        A2["Claude 回复<br/>id: asst1-claude, askId: user1<br/>siblingIds: [asst1-gpt]"]
+    end
+
+    subgraph "Topic快照 (主线)"
+        T["activeMessageIds: [user1, asst1-gpt]"]
+    end
+
+    subgraph "UI渲染 (通过siblingIds扩展)"
+        UI_U1[User: 帮我写个函数]
+        UI_A1["GPT-4 回复 (活跃)"]
+        UI_A2["Claude 回复 (可选)"]
+    end
+
+    U1 --> A1
+    U1 --> A2
+
+    T --> U1
+    T --> A1
+
+    A1 -.->|siblingIds| A2
+    A2 -.->|siblingIds| A1
+
+    UI_U1 -.-> UI_A1
+    UI_U1 -.-> UI_A2
+```
+
+## 5. 数据查询与状态管理
+
+### 5.1 话题加载流程
+
+```mermaid
+sequenceDiagram
+    participant UI
+    participant Redux
+    participant DB
+    participant Selector
+
+    UI->>Redux: loadTopic(topicId)
+    Redux->>DB: 并行查询
+
+    par 查询消息
+        DB->>DB: messages.where('topicId').equals(topicId)
+    and 查询块
+        DB->>DB: messageBlocks.where('topicId').equals(topicId)
+    end
+
+    DB-->>Redux: { messages[], blocks[] }
+    Redux->>Redux: 更新实体状态
+
+    UI->>Selector: selectActiveConversationWithSiblings(topicId)
+    Selector->>Redux: 获取Topic.activeMessageIds
+    Selector->>Redux: 获取messages实体
+    Selector-->>UI: 按快照顺序的消息列表 (含兄弟节点)
+
+    Note over UI: 渲染对话界面 (支持多模型)
+```
+
+### 5.2 渲染选择器（含兄弟节点）
+
+```typescript
+export const selectActiveConversationWithSiblings = createSelector(
+  [
+    (state: RootState, topicId: string) => state.topics.entities[topicId]?.activeMessageIds || [],
+    (state: RootState) => state.messages.entities,
+    (state: RootState) => state.messageBlocks.entities
+  ],
+  (activeMessageIds, messagesEntities, blocksEntities) => {
+    return activeMessageIds
+      .map((messageId) => {
+        const message = messagesEntities[messageId]
+        if (!message) return null
+
+        if (message.role === 'user') {
+          return { type: 'user', message, blocks: getMessageBlocks(message, blocksEntities) }
+        } else if (message.role === 'assistant') {
+          const siblingMessages = (message.siblingIds || []).map((id) => messagesEntities[id]).filter(Boolean)
+          const allAssistantMessages = [message, ...siblingMessages]
+
+          return {
+            type: 'assistant_group',
+            messages: allAssistantMessages.map((msg) => ({
+              message: msg,
+              blocks: getMessageBlocks(msg, blocksEntities),
+              isActive: msg.id === messageId
+            })),
+            activeMessageId: messageId
+          }
+        }
+      })
+      .filter(Boolean)
+  }
+)
+```
+
+**复杂度**：O(N + S) where N = 快照长度, S = 兄弟节点总数
+
+## 6. 时空复杂度分析
+
+### 6.1 核心操作复杂度对比
+
+```mermaid
+graph LR
+    subgraph "现有架构"
+        A1[加载话题: O(M+B)]
+        A2[渲染对话: O(M) 需要过滤排序]
+        A3[发送消息: O(1)]
+    end
+
+    subgraph "新架构 (含多模型)"
+        B1[加载话题: O(M+B) ✅相同]
+        B2[渲染对话: O(N+S) ✅更优]
+        B3[发送消息: O(M_models) ✅相同]
+        B4[版本切换: O(1) ➕新功能]
+        B5[重发消息: O(V)+O(M_models) ➕新功能]
+        B6[模型切换: O(1) ➕新功能]
+    end
+
+    style B1 fill:#c8e6c9
+    style B2 fill:#c8e6c9
+    style B3 fill:#c8e6c9
+    style B4 fill:#fff3e0
+    style B5 fill:#fff3e0
+    style B6 fill:#fff3e0
+```
+
+### 6.2 性能优势分析
+
+| 操作         | 现有架构       | 新架构                       | 优势说明             |
+| ------------ | -------------- | ---------------------------- | -------------------- |
+| **话题加载** | O(M + B)       | O(M + B)                     | 性能保持不变         |
+| **对话渲染** | O(M) 过滤+排序 | **O(N+S)** 直接索引+兄弟扩展 | N << M，S通常较小    |
+| **发送消息** | O(1)           | O(M_models)                  | 支持多模型，合理增长 |
+| **版本切换** | 不支持         | **O(1)**                     | 新功能，极佳性能     |
+| **模型切换** | 不支持         | **O(1)**                     | 新功能，极佳性能     |
+
+**关键优势**：
+
+- **渲染性能提升**：从 O(M) 优化到 O(N+S)，长对话场景收益显著
+- **多模型支持**：通过 siblingIds 优雅实现
+- **版本管理**：O(1) 的版本/模型切换，用户体验极佳
+- **向后兼容**：现有核心操作性能保持不变
+
+## 7. 数据库Schema演进
+
+### 7.1 Migration策略
+
+```mermaid
+flowchart TD
+    A[现有Schema] --> B[添加字段]
+    B --> C[创建索引]
+    C --> D[数据迁移]
+    D --> E[验证完整性]
+
+    B1[Topic: +activeMessageIds]
+    B2[Message: +askId, +parentMessageId<br/>+version, +prevVersionId<br/>+nextVersionId, +groupRequestId<br/>+siblingIds]
+
+    C1[idx_messages_askid_version]
+    C2[idx_messages_parent]
+    C3[idx_messages_group_request]
+
+    D1[生成activeMessageIds快照]
+    D2[设置现有assistant消息version=0]
+
+    B --> B1
+    B --> B2
+    C --> C1
+    C --> C2
+    C --> C3
+    D --> D1
+    D --> D2
+```
+
+### 7.2 SQL Migration
+
+```sql
+-- 1. 添加字段
+ALTER TABLE topics ADD COLUMN activeMessageIds TEXT; -- JSON数组
+ALTER TABLE messages ADD COLUMN askId TEXT;
+ALTER TABLE messages ADD COLUMN parentMessageId TEXT;
+ALTER TABLE messages ADD COLUMN version INTEGER;
+ALTER TABLE messages ADD COLUMN prevVersionId TEXT;
+ALTER TABLE messages ADD COLUMN nextVersionId TEXT;
+ALTER TABLE messages ADD COLUMN groupRequestId TEXT;
+ALTER TABLE messages ADD COLUMN siblingIds TEXT; -- JSON数组
+
+-- 2. 创建索引
+CREATE INDEX idx_messages_askid_version ON messages(askId, version);
+CREATE INDEX idx_messages_parent ON messages(parentMessageId);
+CREATE INDEX idx_messages_group_request ON messages(groupRequestId);
+
+-- 3. 数据迁移
+UPDATE messages SET version = 0 WHERE role = 'assistant';
+```
+
+## 8. 流式更新兼容性
+
+### 8.1 MessageBlock更新流程
+
+```mermaid
+sequenceDiagram
+    participant Stream
+    participant Redux
+    participant DB
+    participant UI
+
+    Note over Stream: 流式内容到达
+    Stream->>Redux: updateBlock(blockId, content)
+    Redux->>Redux: updateOneBlock({ id, changes })
+    Redux->>UI: 立即更新显示
+
+    Note over Redux: 节流数据库写入
+    Redux->>DB: throttledDbUpdate(blockId, content)
+
+    Note over Stream,UI: 版本/兄弟关系不影响块更新
+```
+
+**关键点**：
+
+- MessageBlock 仍然直接关联到 Message
+- 版本/兄弟关系在 Message 层面，不影响 Block 的流式更新
+- 现有的节流机制和更新逻辑完全保持不变
+
+## 9. 系统架构总览
+
+### 9.1 整体架构图
+
+```mermaid
+graph TB
+    subgraph "UI层"
+        UI1[对话界面]
+        UI2[版本选择器]
+        UI3[分支导航]
+        UI4[模型切换器]
+    end
+
+    subgraph "Redux状态层"
+        R1[topics: EntityAdapter]
+        R2[messages: EntityAdapter]
+        R3[messageBlocks: EntityAdapter]
+        S1[selectActiveConversationWithSiblings]
+        S2[selectVersionHistory]
+    end
+
+    subgraph "数据库层"
+        DB1[(topics表)]
+        DB2[(messages表)]
+        DB3[(messageBlocks表)]
+    end
+
+    subgraph "API层"
+        API1[多模型并行请求]
+        API2[流式响应处理]
+    end
+
+    UI1 --> S1
+    UI2 --> S2
+    UI4 --> S1
+    S1 --> R1
+    S1 --> R2
+    S2 --> R2
+
+    R1 <--> DB1
+    R2 <--> DB2
+    R3 <--> DB3
+
+    R2 --> API1
+    API2 --> R3
+
+    style UI1 fill:#e3f2fd
+    style R1 fill:#f3e5f5
+    style R2 fill:#f3e5f5
+    style R3 fill:#f3e5f5
+    style DB1 fill:#e8f5e8
+    style DB2 fill:#e8f5e8
+    style DB3 fill:#e8f5e8
+```
+
+### 9.2 数据流向
+
+```mermaid
+flowchart LR
+    A[用户输入] --> B[创建User Message]
+    B --> C["创建Assistant Messages (多模型)"]
+    C --> C1[设置Sibling关系]
+    C1 --> D["更新Topic快照 (主线)"]
+    D --> E[API并行请求]
+    E --> F[流式更新Blocks]
+    F --> G["UI实时渲染 (含多模型)"]
+
+    H[版本切换] --> I[更新快照指针]
+    I --> G
+
+    J[分支对话] --> K[创建分支消息]
+    K --> D
+
+    L[模型切换] --> I
+
+    style A fill:#ffebee
+    style G fill:#e8f5e8
+    style H fill:#fff3e0
+    style J fill:#f3e5f5
+    style L fill:#e1f5fe
+```
+
+## 10. Redux Slice 实现范例
+
+根据上述架构设计，`messages` slice 将演变为一个纯粹的、由 `createEntityAdapter` 管理的"消息池"。它只负责高效地存储和访问单个消息实体，而不再关心对话的顺序。
+
+### `store/messagesSlice.ts`
+
+```typescript
+import { createSlice, createEntityAdapter, PayloadAction } from '@reduxjs/toolkit'
+import type { RootState } from './store' // 你的store类型定义
+import type { Message } from '@renderer/types/newMessage' // 假设 Message 类型定义在外部
+
+// 1. 创建 Entity Adapter
+// 它会自动生成管理实体的reducer逻辑，实现一个高效的消息池。
+const messagesAdapter = createEntityAdapter<Message>()
+
+// 2. 定义 Slice 的初始状态
+// adapter.getInitialState() 会自动创建 { ids: [], entities: {} } 结构
+const initialState = messagesAdapter.getInitialState()
+
+// 3. 创建 Slice
+const messagesSlice = createSlice({
+  name: 'messages',
+  initialState,
+  // Reducers被极大简化，多数直接引用adapter提供的方法
+  reducers: {
+    // Action: 添加一条消息
+    messageAdded: messagesAdapter.addOne,
+
+    // Action: 一次性添加或更新多个消息 (高性能)
+    // 用途: 加载话题历史、发送新一轮问答(user+assistants)
+    messagesUpserted: messagesAdapter.upsertMany,
+
+    // Action: 更新单个消息
+    // 用途: 流式更新结束、状态变更等
+    messageUpdated: messagesAdapter.updateOne,
+
+    // Action: 删除单个消息
+    messageRemoved: messagesAdapter.removeOne,
+
+    // Action: 删除多个消息
+    messagesRemoved: messagesAdapter.removeMany,
+
+    // Action: 用新数据完全替换消息池
+    // 用途: 首次加载或强制刷新
+    messagesSet: messagesAdapter.setAll
+  }
+})
+
+// 4. 导出 Actions
+export const { messageAdded, messagesUpserted, messageUpdated, messageRemoved, messagesRemoved, messagesSet } =
+  messagesSlice.actions
+
+// 5. 导出 Selectors
+// Adapter 会自动创建高效的查询函数 (e.g., O(1) by ID)
+export const messagesSelectors = messagesAdapter.getSelectors((state: RootState) => state.messages)
+
+// 6. 导出 Reducer
+export default messagesSlice.reducer
+```
+
+### 核心思想总结
+
+1.  **职责单一**: 此 Slice 只做一件事——管理 `Message` 实体。它像一个数据库表，高效地处理增删改查，但对业务逻辑（如对话顺序）一无所知。
+2.  **逻辑上移**: 所有涉及多个 Slice 的复杂业务逻辑（如发送消息、切换版本）都应封装在 **Thunks** 或其他中间件中。Thunk 作为流程协调者，会 `dispatch` 多个原子化的 Action 给 `messagesSlice` 和 `topicsSlice`，以完成一次完整的业务操作并保证数据一致性。
+3.  **性能保证**: `createEntityAdapter` 内部使用哈希表（对象）来存储实体，确保通过 ID 查询消息的操作为 O(1) 复杂度，性能极佳。
+
+### 旧状态属性迁移
+
+为了完成 `messagesSlice` 向纯粹"消息池"的演进，原有的混合状态属性需要被迁移或废弃，以实现彻底的职责分离。
+
+| 原属性 (`newMessage.ts`) | 处理方式      | 新的归宿 / 说明                                                                               |
+| :----------------------- | :------------ | :-------------------------------------------------------------------------------------------- |
+| `messageIdsByTopic`      | **废弃**      | 核心职责转移。由 `topicsSlice` 中的 `activeMessageIds` 字段接管，作为渲染快照。               |
+| `currentTopicId`         | **迁移**      | 属于UI当前上下文状态，应迁移至 `topicsSlice`。                                                |
+| `loadingByTopic`         | **迁移**      | 话题的加载状态与话题本身更相关，应迁移至 `topicsSlice`。                                      |
+| `displayCount`           | **废弃/迁移** | UI相关的显示逻辑，不属于消息数据层。建议迁移至专门的 `Slice` 或在相关组件中作为本地状态管理。 |
--- a/docs/technical/topic-message-tree.png
+++ b/docs/technical/topic-message-tree.png
--- a/docs/testplan-en.md
+++ b/docs/testplan-en.md
@@ -1,99 +0,0 @@
-# Test Plan
-
-To provide users with a more stable application experience and faster iteration speed, Cherry Studio has launched the "Test Plan".
-
-## User Guide
-
-The Test Plan is divided into the RC channel and the Beta channel, with the following differences:
-
- **RC (Release Candidate)**: The features are stable, with fewer bugs, and it is close to the official release.
- **Beta**: Features may change at any time, and there may be more bugs, but users can experience future features earlier.
-
-Users can enable the "Test Plan" and select the version channel in the software's `Settings` > `About`. Please note that the versions in the "Test Plan" cannot guarantee data consistency, so be sure to back up your data before using them.
-
-Users are welcome to submit issues or provide feedback through other channels for any bugs encountered during testing. Your feedback is very important to us.
-
-## Developer Guide
-
-### Participating in the Test Plan
-
-Developers should submit `PRs` according to the [Contributor Guide](../CONTRIBUTING.md) (and ensure the target branch is `main`). The repository maintainers will evaluate whether the `PR` should be included in the Test Plan based on factors such as the impact of the feature on the application, its importance, and whether broader testing is needed.
-
-If the `PR` is added to the Test Plan, the repository maintainers will:
-
- Notify the `PR` submitter.
- Set the PR to `draft` status (to avoid accidental merging into `main` before testing is complete).
- Set the `milestone` to the specific Test Plan version.
- Modify the `PR` title.
-
-During participation in the Test Plan, `PR` submitters should:
-
- Keep the `PR` branch synchronized with the latest `main` (i.e., the `PR` branch should always be based on the latest `main` code).
- Ensure the `PR` branch is conflict-free.
- Actively respond to comments & reviews and fix bugs.
- Enable maintainers to modify the `PR` branch to allow for bug fixes at any time.
-
-Inclusion in the Test Plan does not guarantee the final merging of the `PR`. It may be shelved due to immature features or poor testing feedback.
-
-### Test Plan Lead
-
-A maintainer will be assigned as the lead for a specific version (e.g., `1.5.0-rc`). The responsibilities of the Test Plan lead include:
-
- Determining whether a `PR` meets the Test Plan requirements and deciding whether it should be included in the current Test Plan.
- Modifying the status of `PRs` added to the Test Plan and communicating relevant matters with the `PR` submitter.
- Before the Test Plan release, merging the branches of `PRs` added to the Test Plan (using squash merge) into the corresponding version branch of `testplan` and resolving conflicts.
- Ensuring the `testplan` branch is synchronized with the latest `main`.
- Overseeing the Test Plan release.
-
-## In-Depth Understanding
-
-### About `PRs`
-
-A `PR` is a collection of a specific branch (and commits), comments, reviews, and other information, and it is the **smallest management unit** of the Test Plan.
-
-Compared to submitting all features to a single branch, the Test Plan manages features through `PRs`, which offers greater flexibility and efficiency:
-
- Features can be added or removed between different versions of the Test Plan without cumbersome `revert` operations.
- Clear feature boundaries and responsibilities are established. Bug fixes are completed within their respective `PRs`, isolating cross-impact and better tracking progress.
- The `PR` submitter is responsible for resolving conflicts with the latest `main`. The Test Plan lead is responsible for resolving conflicts between `PR` branches. However, since features added to the Test Plan are relatively independent (in other words, if a feature has broad implications, it should be independently included in the Test Plan), conflicts are generally few or simple.
-
-### The `testplan` Branch
-
-The `testplan` branch is a **temporary** branch used for Test Plan releases.
-
-Note:
-
- **Do not develop based on this branch**. It may change or even be deleted at any time, and there is no guarantee of commit completeness or order.
- **Do not submit `commits` or `PRs` to this branch**, as they will not be retained.
- The `testplan` branch is always based on the latest `main` branch (not on a released version), with features added on top.
-
-#### RC Branch
-
-Branch name: `testplan/rc/x.y.z`
-
-Used for RC releases, where `x.y.z` is the target version number. Note that whether it is rc.1 or rc.5, as long as the major version number is `x.y.z`, it is completed in this branch.
-
-Generally, the version number for releases from this branch is named `x.y.z-rc.n`.
-
-#### Beta Branch
-
-Branch name: `testplan/beta/x.y.z`
-
-Used for Beta releases, where `x.y.z` is the target version number. Note that whether it is beta.1 or beta.5, as long as the major version number is `x.y.z`, it is completed in this branch.
-
-Generally, the version number for releases from this branch is named `x.y.z-beta.n`.
-
-### Version Rules
-
-The application version number for the Test Plan is: `x.y.z-CHA.n`, where:
-
- `x.y.z` is the conventional version number, referred to here as the **target version number**.
- `CHA` is the channel code (Channel), currently divided into `rc` and `beta`.
- `n` is the release number, starting from `1`.
-
-Examples of complete version numbers: `1.5.0-rc.3`, `1.5.1-beta.1`, `1.6.0-beta.6`.
-
-The **target version number** of the Test Plan points to the official version number where these features are expected to be added. For example:
-
- `1.5.0-rc.3` means this is a preview of the `1.5.0` official release (the current latest official release is `1.4.9`, and `1.5.0` has not yet been officially released).
- `1.5.1-beta.1` means this is a beta version of the `1.5.1` official release (the current latest official release is `1.5.0`, and `1.5.1` has not yet been officially released).
--- a/docs/testplan-zh.md
+++ b/docs/testplan-zh.md
@@ -1,99 +0,0 @@
-# 测试计划
-
-为了给用户提供更稳定的应用体验，并提供更快的迭代速度，Cherry Studio推出“测试计划”。
-
-## 用户指南
-
-测试计划分为RC版通道和Beta版通道吗，区别在于：
-
- **RC版（预览版）**：RC即Release Candidate，功能已经稳定，BUG较少，接近正式版
- **Beta版（测试版）**：功能可能随时变化，BUG较多，可以较早体验未来功能
-
-用户可以在软件的`设置`-`关于`中，开启“测试计划”并选择版本通道。请注意“测试计划”的版本无法保证数据的一致性，请使用前一定要备份数据。
-
-用户在测试过程中发现的BUG，欢迎提交issue或通过其他渠道反馈。用户的反馈对我们非常重要。
-
-## 开发者指南
-
-### 参与测试计划
-
-开发者按照[贡献者指南](CONTRIBUTING.zh.md)要求正常提交`PR`（并注意提交target为`main`）。仓库维护者会综合考虑（例如该功能对应用的影响程度，功能的重要性，是否需要更广泛的测试等），决定该`PR`是否应加入测试计划。
-
-若该`PR`加入测试计划，仓库维护者会做如下操作：
-
- 通知`PR`提交人
- 设置PR为`draft`状态（避免在测试完成前意外并入`main`）
- `milestone`设置为具体测试计划版本
- 修改`PR`标题
-
-`PR`提交人在参与测试计划过程中，应做到：
-
- 保持`PR`分支与最新`main`同步（即`PR`分支总是应基于最新`main`代码）
- 保持`PR`分支为无冲突状态
- 积极响应 comments & reviews，修复bug
- 开启维护者可以修改`PR`分支的权限，以便维护者能随时修改BUG
-
-加入测试计划并不保证`PR`的最终合并，也有可能由于功能不成熟或测试反馈不佳而搁置
-
-### 测试计划负责人
-
-某个维护者会被指定为某个版本期间（例如`1.5.0-rc`）的测试计划负责人。测试计划负责人的工作为：
-
- 判断某个`PR`是否符合测试计划要求，并决定是否应合入当期测试计划
- 修改加入测试计划的`PR`状态，并与`PR`提交人沟通相关事宜
- 在测试计划发版前，将加入测试计划的`PR`分支逐一合并（采用squash merge）至`testplan`对应版本分支，并解决冲突
- 保证`testplan`分支与最新`main`同步
- 负责测试计划发版
-
-## 深入理解
-
-### 关于`PR`
-
-`PR`是特定分支（及commits）、comments、reviews等各种信息的集合，也是测试计划的**最小管理单元**。
-
-相比将所有功能都提交到某个分支，测试计划通过`PR`来管理功能，这可以带来极大的灵活度和效率：
-
- 测试计划的各个版本间，可以随意增减功能，而无需繁琐的`revert`操作
- 明确了功能边界和负责人，bug修复在各自`PR`中完成，隔离了交叉影响，也能更好观察进度
- `PR`提交人负责与最新`main`之间的冲突；测试计划负责人负责各`PR`分支之间的冲突，但因加入测试计划的各功能相对比较独立（话句话说，如果功能牵涉较广，则应独立上测试计划），冲突一般比较少或简单。
-
-### `testplan`分支
-
-`testplan`分支是用于测试计划发版所用的**临时**分支。
-
-注意：
-
- **请勿基于该分支开发**。该分支随时会变化甚至删除，且并不保证commit的完整和顺序。
- **请勿向该分支提交`commit`及`PR`**，将不会得到保留
- `testplan`分支总是基于最新`main`分支（而不是基于已发布版本），在其之上添加功能
-
-#### RC版分支
-
-分支名称：`testplan/rc/x.y.z`
-
-用于RC版的发版，x.y.z为目标版本号，注意无论是rc.1还是rc.5，只要主版本号为x.y.z，都在该分支完成。
-
-一般而言，该分支发版的版本号命名为`x.y.z-rc.n`
-
-#### Beta版分支
-
-分支名称：`testplan/beta/x.y.z`
-
-用于Beta版的发版，x.y.z为目标版本号，注意无论是beta.1还是beta.5，只要主版本号为x.y.z，都在该分支完成。
-
-一般而言，该分支发版的版本号命名为`x.y.z-beta.n`
-
-### 版本规则
-
-测试计划的应用版本号为：`x.y.z-CHA.n`，其中：
-
- `x.y.z`为一般意义上的版本号，在这里称为**目标版本号**
- `CHA`为通道号（Channel），现在分为`rc`和`beta`
- `n`为发版编号，从`1`计数
-
-完整的版本号举例：`1.5.0-rc.3`、`1.5.1-beta.1`、`1.6.0-beta.6`
-
-测试计划的**目标版本号**指向希望添加这些功能的正式版版本号。例如：
-
- `1.5.0-rc.3`是指，这是`1.5.0`正式版的预览版（当前最新正式版是`1.4.9`，而`1.5.0`正式版还未发布）
- `1.5.1-beta.1`是指，这是`1.5.1`正式版的测试版（当前最新正式版是`1.5.0`，而`1.5.1`正式版还未发布）
--- a/electron-builder.yml
+++ b/electron-builder.yml
@@ -11,11 +11,6 @@ electronLanguages:
  - en # for macOS
 directories:
  buildResources: build
-
-protocols:
-  - name: Cherry Studio
-    schemes:
-      - cherrystudio
 files:
  - '**/*'
  - '!**/{.vscode,.yarn,.yarn-lock,.github,.cursorrules,.prettierrc}'
@@ -53,11 +48,7 @@ files:
  - '!node_modules/pdf-parse/lib/pdf.js/{v1.9.426,v1.10.88,v2.0.550}'
  - '!node_modules/mammoth/{mammoth.browser.js,mammoth.browser.min.js}'
  - '!node_modules/selection-hook/prebuilds/**/*' # we rebuild .node, don't use prebuilds
-  - '!node_modules/pdfjs-dist/web/**/*'
-  - '!node_modules/pdfjs-dist/legacy/web/*'
-  - '!node_modules/selection-hook/node_modules' # we don't need what in the node_modules dir
-  - '!node_modules/selection-hook/src' # we don't need source files
-  - '!**/*.{h,iobj,ipdb,tlog,recipe,vcxproj,vcxproj.filters,Makefile,*.Makefile}' # filter .node build files
+  - '!**/*.{h,iobj,ipdb,tlog,recipe,vcxproj,vcxproj.filters}' # filter .node build files
 asarUnpack:
  - resources/**
  - '**/*.{metal,exp,lib}'
@@ -99,7 +90,6 @@ linux:
  artifactName: ${productName}-${version}-${arch}.${ext}
  target:
    - target: AppImage
-    - target: deb
  maintainer: electronjs.org
  category: Utility
  desktop:
@@ -117,9 +107,11 @@ afterSign: scripts/notarize.js
 artifactBuildCompleted: scripts/artifact-build-completed.js
 releaseInfo:
  releaseNotes: |
-    划词助手：支持 macOS 系统
-    文档处理：增加 MinerU、Doc2x，Mistral 等服务商支持
-    知识库：新的知识库界面，增加扫描版 PDF 支持
-    OCR：macOS 增加系统 OCR 支持
-    服务商：支持一键添加服务商，新增 PH8 大模型开放平台, 支持 PPIO OAuth 登录
-    修复：Linux下数据目录移动问题
+    划词助手：支持文本选择快捷键、开关快捷键、思考块支持和引用功能
+    复制功能：新增纯文本复制（去除Markdown格式符号）
+    知识库：支持设置向量维度，修复Ollama分数错误和维度编辑问题
+    多语言：增加模型名称多语言提示和翻译源语言手动选择
+    文件管理：修复主题/消息删除时文件未清理问题，优化文件选择流程
+    模型：修复Gemini模型推理预算、Voyage AI嵌入问题和DeepSeek翻译模型更新
+    图像功能：统一图片查看器，支持Base64图片渲染，修复图片预览相关问题
+    UI：实现标签折叠/拖拽排序，修复气泡溢出，增加引文索引显示
--- a/electron.vite.config.ts
+++ b/electron.vite.config.ts
@@ -1,5 +1,4 @@
 import react from '@vitejs/plugin-react-swc'
-import { CodeInspectorPlugin } from 'code-inspector-plugin'
 import { defineConfig, externalizeDepsPlugin } from 'electron-vite'
 import { resolve } from 'path'
 import { visualizer } from 'rollup-plugin-visualizer'
@@ -20,13 +19,7 @@ export default defineConfig({
    },
    build: {
      rollupOptions: {
-        external: ['@libsql/client', 'bufferutil', 'utf-8-validate', '@cherrystudio/mac-system-ocr'],
-        output: {
-          // 彻底禁用代码分割 - 返回 null 强制单文件打包
-          manualChunks: undefined,
-          // 内联所有动态导入，这是关键配置
-          inlineDynamicImports: true
-        }
+        external: ['@libsql/client', 'bufferutil', 'utf-8-validate']
      },
      sourcemap: process.env.NODE_ENV === 'development'
    },
@@ -60,14 +53,6 @@ export default defineConfig({
          ]
        ]
      }),
-      // 只在开发环境下启用 CodeInspectorPlugin
-      ...(process.env.NODE_ENV === 'development'
-        ? [
-            CodeInspectorPlugin({
-              bundler: 'vite'
-            })
-          ]
-        : []),
      ...visualizerPlugin('renderer')
    ],
    resolve: {
@@ -77,16 +62,12 @@ export default defineConfig({
      }
    },
    optimizeDeps: {
-      exclude: ['pyodide'],
-      esbuildOptions: {
-        target: 'esnext' // for dev
-      }
+      exclude: ['pyodide']
    },
    worker: {
      format: 'es'
    },
    build: {
-      target: 'esnext', // for build
      rollupOptions: {
        input: {
          index: resolve(__dirname, 'src/renderer/index.html'),
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
  "name": "CherryStudio",
-  "version": "1.4.8",
+  "version": "1.4.2",
  "private": true,
  "description": "A powerful AI assistant for producer.",
  "main": "./out/main/index.js",
@@ -58,25 +58,6 @@
    "prepare": "husky"
  },
  "dependencies": {
-    "@cherrystudio/pdf-to-img-napi": "^0.0.1",
-    "@libsql/client": "0.14.0",
-    "@libsql/win32-x64-msvc": "^0.4.7",
-    "@strongtz/win32-arm64-msvc": "^0.4.7",
-    "jsdom": "26.1.0",
-    "macos-release": "^3.4.0",
-    "node-stream-zip": "^1.15.0",
-    "notion-helper": "^1.3.22",
-    "os-proxy-config": "^1.1.2",
-    "pdfjs-dist": "4.10.38",
-    "selection-hook": "^1.0.4",
-    "turndown": "7.2.0"
-  },
-  "devDependencies": {
-    "@agentic/exa": "^7.3.3",
-    "@agentic/searxng": "^7.3.3",
-    "@agentic/tavily": "^7.3.3",
-    "@ant-design/v5-patch-for-react-19": "^1.0.3",
-    "@anthropic-ai/sdk": "^0.41.0",
    "@cherrystudio/embedjs": "^0.1.31",
    "@cherrystudio/embedjs-libsql": "^0.1.31",
    "@cherrystudio/embedjs-loader-csv": "^0.1.31",
@@ -89,30 +70,61 @@
    "@cherrystudio/embedjs-loader-xml": "^0.1.31",
    "@cherrystudio/embedjs-ollama": "^0.1.31",
    "@cherrystudio/embedjs-openai": "^0.1.31",
+    "@electron-toolkit/utils": "^3.0.0",
+    "@langchain/community": "^0.3.36",
+    "@langchain/ollama": "^0.2.1",
+    "@strongtz/win32-arm64-msvc": "^0.4.7",
+    "@tanstack/react-query": "^5.27.0",
+    "@types/react-infinite-scroll-component": "^5.0.0",
+    "archiver": "^7.0.1",
+    "async-mutex": "^0.5.0",
+    "diff": "^7.0.0",
+    "docx": "^9.0.2",
+    "electron-log": "^5.1.5",
+    "electron-store": "^8.2.0",
+    "electron-updater": "6.6.4",
+    "electron-window-state": "^5.0.3",
+    "epub": "patch:epub@npm%3A1.3.0#~/.yarn/patches/epub-npm-1.3.0-8325494ffe.patch",
+    "fast-xml-parser": "^5.2.0",
+    "franc-min": "^6.2.0",
+    "fs-extra": "^11.2.0",
+    "jsdom": "^26.0.0",
+    "markdown-it": "^14.1.0",
+    "node-stream-zip": "^1.15.0",
+    "officeparser": "^4.1.1",
+    "os-proxy-config": "^1.1.2",
+    "proxy-agent": "^6.5.0",
+    "remove-markdown": "^0.6.2",
+    "selection-hook": "^0.9.23",
+    "tar": "^7.4.3",
+    "turndown": "^7.2.0",
+    "webdav": "^5.8.0",
+    "zipread": "^1.3.3"
+  },
+  "devDependencies": {
+    "@agentic/exa": "^7.3.3",
+    "@agentic/searxng": "^7.3.3",
+    "@agentic/tavily": "^7.3.3",
+    "@ant-design/v5-patch-for-react-19": "^1.0.3",
+    "@anthropic-ai/sdk": "^0.41.0",
    "@electron-toolkit/eslint-config-prettier": "^3.0.0",
    "@electron-toolkit/eslint-config-ts": "^3.0.0",
    "@electron-toolkit/preload": "^3.0.0",
    "@electron-toolkit/tsconfig": "^1.0.1",
-    "@electron-toolkit/utils": "^3.0.0",
    "@electron/notarize": "^2.5.0",
    "@emotion/is-prop-valid": "^1.3.1",
    "@eslint-react/eslint-plugin": "^1.36.1",
    "@eslint/js": "^9.22.0",
-    "@google/genai": "patch:@google/genai@npm%3A1.0.1#~/.yarn/patches/@google-genai-npm-1.0.1-e26f0f9af7.patch",
+    "@google/genai": "^1.0.1",
    "@hello-pangea/dnd": "^16.6.0",
    "@kangfenmao/keyv-storage": "^0.1.0",
-    "@langchain/community": "^0.3.36",
-    "@langchain/ollama": "^0.2.1",
-    "@mistralai/mistralai": "^1.6.0",
    "@modelcontextprotocol/sdk": "^1.11.4",
    "@mozilla/readability": "^0.6.0",
    "@notionhq/client": "^2.2.15",
    "@playwright/test": "^1.52.0",
    "@reduxjs/toolkit": "^2.2.5",
-    "@shikijs/markdown-it": "^3.7.0",
+    "@shikijs/markdown-it": "^3.4.2",
    "@swc/plugin-styled-components": "^7.1.5",
-    "@tanstack/react-query": "^5.27.0",
-    "@tanstack/react-virtual": "^3.13.12",
    "@testing-library/dom": "^10.4.0",
    "@testing-library/jest-dom": "^6.6.3",
    "@testing-library/react": "^16.3.0",
@@ -129,50 +141,34 @@
    "@types/react-infinite-scroll-component": "^5.0.0",
    "@types/react-window": "^1",
    "@types/tinycolor2": "^1",
-    "@types/word-extractor": "^1",
-    "@uiw/codemirror-extensions-langs": "^4.23.14",
-    "@uiw/codemirror-themes-all": "^4.23.14",
-    "@uiw/react-codemirror": "^4.23.14",
+    "@uiw/codemirror-extensions-langs": "^4.23.12",
+    "@uiw/codemirror-themes-all": "^4.23.12",
+    "@uiw/react-codemirror": "^4.23.12",
    "@vitejs/plugin-react-swc": "^3.9.0",
    "@vitest/browser": "^3.1.4",
    "@vitest/coverage-v8": "^3.1.4",
    "@vitest/ui": "^3.1.4",
    "@vitest/web-worker": "^3.1.4",
    "@xyflow/react": "^12.4.4",
-    "antd": "patch:antd@npm%3A5.24.7#~/.yarn/patches/antd-npm-5.24.7-356a553ae5.patch",
-    "archiver": "^7.0.1",
-    "async-mutex": "^0.5.0",
+    "antd": "^5.22.5",
    "axios": "^1.7.3",
    "browser-image-compression": "^2.0.2",
-    "code-inspector-plugin": "^0.20.14",
    "color": "^5.0.0",
-    "country-flag-emoji-polyfill": "0.1.8",
    "dayjs": "^1.11.11",
    "dexie": "^4.0.8",
    "dexie-react-hooks": "^1.1.7",
-    "diff": "^7.0.0",
-    "docx": "^9.0.2",
    "dotenv-cli": "^7.4.2",
-    "electron": "35.6.0",
+    "electron": "35.4.0",
    "electron-builder": "26.0.15",
    "electron-devtools-installer": "^3.2.0",
-    "electron-log": "^5.1.5",
-    "electron-store": "^8.2.0",
-    "electron-updater": "6.6.4",
    "electron-vite": "^3.1.0",
-    "electron-window-state": "^5.0.3",
    "emittery": "^1.0.3",
    "emoji-picker-element": "^1.22.1",
-    "epub": "patch:epub@npm%3A1.3.0#~/.yarn/patches/epub-npm-1.3.0-8325494ffe.patch",
    "eslint": "^9.22.0",
    "eslint-plugin-react-hooks": "^5.2.0",
    "eslint-plugin-simple-import-sort": "^12.1.1",
    "eslint-plugin-unused-imports": "^4.1.4",
    "fast-diff": "^1.3.0",
-    "fast-xml-parser": "^5.2.0",
-    "franc-min": "^6.2.0",
-    "fs-extra": "^11.2.0",
-    "google-auth-library": "^9.15.1",
    "html-to-image": "^1.11.13",
    "husky": "^9.1.7",
    "i18next": "^23.11.5",
@@ -181,24 +177,21 @@
    "lodash": "^4.17.21",
    "lru-cache": "^11.1.0",
    "lucide-react": "^0.487.0",
-    "markdown-it": "^14.1.0",
-    "mermaid": "^11.7.0",
+    "mermaid": "^11.6.0",
    "mime": "^4.0.4",
    "motion": "^12.10.5",
    "npx-scope-finder": "^1.2.0",
-    "officeparser": "^4.1.1",
    "openai": "patch:openai@npm%3A5.1.0#~/.yarn/patches/openai-npm-5.1.0-0e7b3ccb07.patch",
    "p-queue": "^8.1.0",
    "playwright": "^1.52.0",
    "prettier": "^3.5.3",
-    "proxy-agent": "^6.5.0",
    "rc-virtual-list": "^3.18.6",
    "react": "^19.0.0",
    "react-dom": "^19.0.0",
    "react-hotkeys-hook": "^4.6.1",
    "react-i18next": "^14.1.2",
    "react-infinite-scroll-component": "^6.1.0",
-    "react-markdown": "^10.1.0",
+    "react-markdown": "^9.0.1",
    "react-redux": "^9.1.2",
    "react-router": "6",
    "react-router-dom": "6",
@@ -207,30 +200,22 @@
    "redux": "^5.0.1",
    "redux-persist": "^6.0.0",
    "rehype-katex": "^7.0.1",
-    "rehype-mathjax": "^7.1.0",
+    "rehype-mathjax": "^7.0.0",
    "rehype-raw": "^7.0.0",
-    "remark-cjk-friendly": "^1.2.0",
-    "remark-gfm": "^4.0.1",
+    "remark-cjk-friendly": "^1.1.0",
+    "remark-gfm": "^4.0.0",
    "remark-math": "^6.0.0",
-    "remove-markdown": "^0.6.2",
    "rollup-plugin-visualizer": "^5.12.0",
    "sass": "^1.88.0",
-    "shiki": "^3.7.0",
+    "shiki": "^3.4.2",
    "string-width": "^7.2.0",
    "styled-components": "^6.1.11",
-    "tar": "^7.4.3",
    "tiny-pinyin": "^1.3.2",
-    "tokenx": "^1.1.0",
+    "tokenx": "^0.4.1",
    "typescript": "^5.6.2",
    "uuid": "^10.0.0",
    "vite": "6.2.6",
-    "vitest": "^3.1.4",
-    "webdav": "^5.8.0",
-    "word-extractor": "^1.0.4",
-    "zipread": "^1.3.3"
-  },
-  "optionalDependencies": {
-    "@cherrystudio/mac-system-ocr": "^0.2.2"
+    "vitest": "^3.1.4"
  },
  "resolutions": {
    "pdf-parse@npm:1.1.1": "patch:pdf-parse@npm%3A1.1.1#~/.yarn/patches/pdf-parse-npm-1.1.1-04a6109b2a.patch",
--- a/packages/shared/IpcChannel.ts
+++ b/packages/shared/IpcChannel.ts
@@ -3,8 +3,6 @@ export enum IpcChannel {
  App_ClearCache = 'app:clear-cache',
  App_SetLaunchOnBoot = 'app:set-launch-on-boot',
  App_SetLanguage = 'app:set-language',
-  App_SetEnableSpellCheck = 'app:set-enable-spell-check',
-  App_SetSpellCheckLanguages = 'app:set-spell-check-languages',
  App_ShowUpdateDialog = 'app:show-update-dialog',
  App_CheckForUpdate = 'app:check-for-update',
  App_Reload = 'app:reload',
@@ -15,34 +13,20 @@ export enum IpcChannel {
  App_SetTrayOnClose = 'app:set-tray-on-close',
  App_SetTheme = 'app:set-theme',
  App_SetAutoUpdate = 'app:set-auto-update',
-  App_SetTestPlan = 'app:set-test-plan',
-  App_SetTestChannel = 'app:set-test-channel',
+  App_SetFeedUrl = 'app:set-feed-url',
  App_HandleZoomFactor = 'app:handle-zoom-factor',
-  App_Select = 'app:select',
-  App_HasWritePermission = 'app:has-write-permission',
-  App_Copy = 'app:copy',
-  App_SetStopQuitApp = 'app:set-stop-quit-app',
-  App_SetAppDataPath = 'app:set-app-data-path',
-  App_GetDataPathFromArgs = 'app:get-data-path-from-args',
-  App_FlushAppData = 'app:flush-app-data',
-  App_IsNotEmptyDir = 'app:is-not-empty-dir',
-  App_RelaunchApp = 'app:relaunch-app',
+
  App_IsBinaryExist = 'app:is-binary-exist',
  App_GetBinaryPath = 'app:get-binary-path',
  App_InstallUvBinary = 'app:install-uv-binary',
  App_InstallBunBinary = 'app:install-bun-binary',

-  App_MacIsProcessTrusted = 'app:mac-is-process-trusted',
-  App_MacRequestProcessTrust = 'app:mac-request-process-trust',
-
  App_QuoteToMain = 'app:quote-to-main',
-  App_SetDisableHardwareAcceleration = 'app:set-disable-hardware-acceleration',

  Notification_Send = 'notification:send',
  Notification_OnClick = 'notification:on-click',

  Webview_SetOpenLinkExternal = 'webview:set-open-link-external',
-  Webview_SetSpellCheckEnabled = 'webview:set-spell-check-enabled',

  // Open
  Open_Path = 'open:path',
@@ -75,9 +59,6 @@ export enum IpcChannel {
  Mcp_ServersUpdated = 'mcp:servers-updated',
  Mcp_CheckConnectivity = 'mcp:check-connectivity',

-  // Python
-  Python_Execute = 'python:execute',
-
  //copilot
  Copilot_GetAuthMessage = 'copilot:get-auth-message',
  Copilot_GetCopilotToken = 'copilot:get-copilot-token',
@@ -105,10 +86,6 @@ export enum IpcChannel {
  Gemini_ListFiles = 'gemini:list-files',
  Gemini_DeleteFile = 'gemini:delete-file',

-  // VertexAI
-  VertexAI_GetAuthHeaders = 'vertexai:get-auth-headers',
-  VertexAI_ClearAuthCache = 'vertexai:clear-auth-cache',
-
  Windows_ResetMinimumSize = 'window:reset-minimum-size',
  Windows_SetMinimumSize = 'window:set-minimum-size',

@@ -119,7 +96,6 @@ export enum IpcChannel {
  KnowledgeBase_Remove = 'knowledge-base:remove',
  KnowledgeBase_Search = 'knowledge-base:search',
  KnowledgeBase_Rerank = 'knowledge-base:rerank',
-  KnowledgeBase_Check_Quota = 'knowledge-base:check-quota',

  //file
  File_Open = 'file:open',
@@ -130,10 +106,9 @@ export enum IpcChannel {
  File_Clear = 'file:clear',
  File_Read = 'file:read',
  File_Delete = 'file:delete',
-  File_DeleteDir = 'file:deleteDir',
  File_Get = 'file:get',
  File_SelectFolder = 'file:selectFolder',
-  File_CreateTempFile = 'file:createTempFile',
+  File_Create = 'file:create',
  File_Write = 'file:write',
  File_WriteWithId = 'file:writeWithId',
  File_SaveImage = 'file:saveImage',
@@ -143,15 +118,8 @@ export enum IpcChannel {
  File_Copy = 'file:copy',
  File_BinaryImage = 'file:binaryImage',
  File_Base64File = 'file:base64File',
-  File_GetPdfInfo = 'file:getPdfInfo',
  Fs_Read = 'fs:read',

-  // file service
-  FileService_Upload = 'file-service:upload',
-  FileService_List = 'file-service:list',
-  FileService_Delete = 'file-service:delete',
-  FileService_Retrieve = 'file-service:retrieve',
-
  Export_Word = 'export:word',

  Shortcuts_Update = 'shortcuts:update',
--- a/packages/shared/config/constant.ts
+++ b/packages/shared/config/constant.ts
@@ -1,7 +1,7 @@
 export const imageExts = ['.jpg', '.jpeg', '.png', '.gif', '.bmp', '.webp']
 export const videoExts = ['.mp4', '.avi', '.mov', '.wmv', '.flv', '.mkv']
 export const audioExts = ['.mp3', '.wav', '.ogg', '.flac', '.aac']
-export const documentExts = ['.pdf', '.doc', '.docx', '.pptx', '.xlsx', '.odt', '.odp', '.ods']
+export const documentExts = ['.pdf', '.docx', '.pptx', '.xlsx', '.odt', '.odp', '.ods']
 export const thirdPartyApplicationExts = ['.draftsExport']
 export const bookExts = ['.epub']
 const textExtsByCategory = new Map([
@@ -406,16 +406,5 @@ export const defaultLanguage = 'en-US'

 export enum FeedUrl {
  PRODUCTION = 'https://releases.cherry-ai.com',
-  GITHUB_LATEST = 'https://github.com/CherryHQ/cherry-studio/releases/latest/download',
-  PRERELEASE_LOWEST = 'https://github.com/CherryHQ/cherry-studio/releases/download/v1.4.0'
+  EARLY_ACCESS = 'https://github.com/CherryHQ/cherry-studio/releases/latest/download'
 }
-
-export enum UpgradeChannel {
-  LATEST = 'latest', // 最新稳定版本
-  RC = 'rc', // 公测版本
-  BETA = 'beta' // 预览版本
-}
-
-export const defaultTimeout = 10 * 1000 * 60
-
-export const occupiedDirs = ['logs', 'Network', 'Partitions/webview/Network']
--- a/packages/shared/config/languages.ts
+++ b/packages/shared/config/languages.ts
--- a/packages/shared/config/types.ts
+++ b/packages/shared/config/types.ts
@@ -1,11 +1,6 @@
-import { ProcessingStatus } from '@types'
-
 export type LoaderReturn = {
  entriesAdded: number
  uniqueId: string
  uniqueIds: string[]
  loaderType: string
-  status?: ProcessingStatus
-  message?: string
-  messageSource?: 'preprocess' | 'embedding'
 }
--- a/resources/data/agents-en.json
+++ b/resources/data/agents-en.json
--- a/resources/data/agents-zh.json
+++ b/resources/data/agents-zh.json
--- a/resources/model-catalogs/01-ai/yi-large.yaml
+++ b/resources/model-catalogs/01-ai/yi-large.yaml
@@ -1,47 +0,0 @@
-id: 01-ai/yi-large
-canonical_slug: 01-ai/yi-large
-hugging_face_id: ''
-name: '01.AI: Yi Large'
-type: chat
-created: 1719273600
-description: |-
-  The Yi Large model was designed by 01.AI with the following usecases in mind: knowledge search, data classification, human-like chat bots, and customer service.
-
-  It stands out for its multilingual proficiency, particularly in Spanish, Chinese, Japanese, German, and French.
-
-  Check out the [launch announcement](https://01-ai.github.io/blog/01.ai-yi-large-llm-launch) to learn more.
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Yi
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000003'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - response_format
-  - structured_outputs
-  - logit_bias
-  - logprobs
-  - top_logprobs
-model_provider: 01-ai
--- a/resources/model-catalogs/aetherwiing/mn-starcannon-12b.yaml
+++ b/resources/model-catalogs/aetherwiing/mn-starcannon-12b.yaml
@@ -1,42 +0,0 @@
-id: aetherwiing/mn-starcannon-12b
-canonical_slug: aetherwiing/mn-starcannon-12b
-hugging_face_id: aetherwiing/MN-12B-Starcannon-v2
-name: 'Aetherwiing: Starcannon 12B'
-type: chat
-created: 1723507200
-description: |-
-  Starcannon 12B v2 is a creative roleplay and story writing model, based on Mistral Nemo, using [nothingiisreal/mn-celeste-12b](/nothingiisreal/mn-celeste-12b) as a base, with [intervitens/mini-magnum-12b-v1.1](https://huggingface.co/intervitens/mini-magnum-12b-v1.1) merged in using the [TIES](https://arxiv.org/abs/2306.01708) method.
-
-  Although more similar to Magnum overall, the model remains very creative, with a pleasant writing style. It is recommended for people wanting more variety than Magnum, and yet more verbose prose than Celeste.
-context_length: 16384
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Mistral
-  instruct_type: chatml
-pricing:
-  prompt: '0.0000008'
-  completion: '0.0000012'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - top_k
-  - min_p
-  - seed
-model_provider: aetherwiing
--- a/resources/model-catalogs/ai21/jamba-1.6-large.yaml
+++ b/resources/model-catalogs/ai21/jamba-1.6-large.yaml
@@ -1,38 +0,0 @@
-id: ai21/jamba-1.6-large
-canonical_slug: ai21/jamba-1.6-large
-hugging_face_id: ai21labs/AI21-Jamba-Large-1.6
-name: 'AI21: Jamba 1.6 Large'
-type: chat
-created: 1741905173
-description: |-
-  AI21 Jamba Large 1.6 is a high-performance hybrid foundation model combining State Space Models (Mamba) with Transformer attention mechanisms. Developed by AI21, it excels in extremely long-context handling (256K tokens), demonstrates superior inference efficiency (up to 2.5x faster than comparable models), and supports structured JSON output and tool-use capabilities. It has 94 billion active parameters (398 billion total), optimized quantization support (ExpertsInt8), and multilingual proficiency in languages such as English, Spanish, French, Portuguese, Italian, Dutch, German, Arabic, and Hebrew.
-
-  Usage of this model is subject to the [Jamba Open Model License](https://www.ai21.com/licenses/jamba-open-model-license).
-context_length: 256000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.000002'
-  completion: '0.000008'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-model_provider: ai21
--- a/resources/model-catalogs/ai21/jamba-1.6-mini.yaml
+++ b/resources/model-catalogs/ai21/jamba-1.6-mini.yaml
@@ -1,38 +0,0 @@
-id: ai21/jamba-1.6-mini
-canonical_slug: ai21/jamba-1.6-mini
-hugging_face_id: ai21labs/AI21-Jamba-Mini-1.6
-name: 'AI21: Jamba Mini 1.6'
-type: chat
-created: 1741905171
-description: |-
-  AI21 Jamba Mini 1.6 is a hybrid foundation model combining State Space Models (Mamba) with Transformer attention mechanisms. With 12 billion active parameters (52 billion total), this model excels in extremely long-context tasks (up to 256K tokens) and achieves superior inference efficiency, outperforming comparable open models on tasks such as retrieval-augmented generation (RAG) and grounded question answering. Jamba Mini 1.6 supports multilingual tasks across English, Spanish, French, Portuguese, Italian, Dutch, German, Arabic, and Hebrew, along with structured JSON output and tool-use capabilities.
-
-  Usage of this model is subject to the [Jamba Open Model License](https://www.ai21.com/licenses/jamba-open-model-license).
-context_length: 256000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000002'
-  completion: '0.0000004'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-model_provider: ai21
--- a/resources/model-catalogs/aion-labs/aion-1.0-mini.yaml
+++ b/resources/model-catalogs/aion-labs/aion-1.0-mini.yaml
@@ -1,34 +0,0 @@
-id: aion-labs/aion-1.0-mini
-canonical_slug: aion-labs/aion-1.0-mini
-hugging_face_id: FuseAI/FuseO1-DeepSeekR1-QwQ-SkyT1-32B-Preview
-name: 'AionLabs: Aion-1.0-Mini'
-type: chat
-created: 1738697107
-description: Aion-1.0-Mini 32B parameter model is a distilled version of the DeepSeek-R1 model, designed for strong performance in reasoning domains such as mathematics, coding, and logic. It is a modified variant of a FuseAI model that outperforms R1-Distill-Qwen-32B and R1-Distill-Llama-70B, with benchmark results available on its [Hugging Face page](https://huggingface.co/FuseAI/FuseO1-DeepSeekR1-QwQ-SkyT1-32B-Preview), independently replicated for verification.
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000007'
-  completion: '0.0000014'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - reasoning
-  - include_reasoning
-model_provider: aion-labs
--- a/resources/model-catalogs/aion-labs/aion-1.0.yaml
+++ b/resources/model-catalogs/aion-labs/aion-1.0.yaml
@@ -1,34 +0,0 @@
-id: aion-labs/aion-1.0
-canonical_slug: aion-labs/aion-1.0
-hugging_face_id: ''
-name: 'AionLabs: Aion-1.0'
-type: chat
-created: 1738697557
-description: Aion-1.0 is a multi-model system designed for high performance across various tasks, including reasoning and coding. It is built on DeepSeek-R1, augmented with additional models and techniques such as Tree of Thoughts (ToT) and Mixture of Experts (MoE). It is Aion Lab's most powerful reasoning model.
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.000004'
-  completion: '0.000008'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - reasoning
-  - include_reasoning
-model_provider: aion-labs
--- a/resources/model-catalogs/aion-labs/aion-rp-llama-3.1-8b.yaml
+++ b/resources/model-catalogs/aion-labs/aion-rp-llama-3.1-8b.yaml
@@ -1,32 +0,0 @@
-id: aion-labs/aion-rp-llama-3.1-8b
-canonical_slug: aion-labs/aion-rp-llama-3.1-8b
-hugging_face_id: ''
-name: 'AionLabs: Aion-RP 1.0 (8B)'
-type: chat
-created: 1738696718
-description: Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s responses. It is a fine-tuned base model rather than an instruct model, designed to produce more natural and varied writing.
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000002'
-  completion: '0.0000002'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-model_provider: aion-labs
--- a/resources/model-catalogs/alfredpros/codellama-7b-instruct-solidity.yaml
+++ b/resources/model-catalogs/alfredpros/codellama-7b-instruct-solidity.yaml
@@ -1,39 +0,0 @@
-id: alfredpros/codellama-7b-instruct-solidity
-canonical_slug: alfredpros/codellama-7b-instruct-solidity
-hugging_face_id: AlfredPros/CodeLlama-7b-Instruct-Solidity
-name: 'AlfredPros: CodeLLaMa 7B Instruct Solidity'
-type: chat
-created: 1744641874
-description: A finetuned 7 billion parameters Code LLaMA - Instruct model to generate Solidity smart contract using 4-bit QLoRA finetuning provided by PEFT library.
-context_length: 4096
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: alpaca
-pricing:
-  prompt: '0.0000008'
-  completion: '0.0000012'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - top_k
-  - min_p
-  - seed
-model_provider: alfredpros
--- a/resources/model-catalogs/all-hands/openhands-lm-32b-v0.1.yaml
+++ b/resources/model-catalogs/all-hands/openhands-lm-32b-v0.1.yaml
@@ -1,44 +0,0 @@
-id: all-hands/openhands-lm-32b-v0.1
-canonical_slug: all-hands/openhands-lm-32b-v0.1
-hugging_face_id: all-hands/openhands-lm-32b-v0.1
-name: OpenHands LM 32B V0.1
-type: chat
-created: 1743613013
-description: |-
-  OpenHands LM v0.1 is a 32B open-source coding model fine-tuned from Qwen2.5-Coder-32B-Instruct using reinforcement learning techniques outlined in SWE-Gym. It is optimized for autonomous software development agents and achieves strong performance on SWE-Bench Verified, with a 37.2% resolve rate. The model supports a 128K token context window, making it well-suited for long-horizon code reasoning and large codebase tasks.
-
-  OpenHands LM is designed for local deployment and runs on consumer-grade GPUs such as a single 3090. It enables fully offline agent workflows without dependency on proprietary APIs. This release is intended as a research preview, and future updates aim to improve generalizability, reduce repetition, and offer smaller variants.
-context_length: 16384
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000026'
-  completion: '0.0000034'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - top_k
-  - min_p
-  - seed
-model_provider: all-hands
--- a/resources/model-catalogs/alpindale/goliath-120b.yaml
+++ b/resources/model-catalogs/alpindale/goliath-120b.yaml
@@ -1,48 +0,0 @@
-id: alpindale/goliath-120b
-canonical_slug: alpindale/goliath-120b
-hugging_face_id: alpindale/goliath-120b
-name: Goliath 120B
-type: chat
-created: 1699574400
-description: |-
-  A large LLM created by combining two fine-tuned Llama 70B models into one 120B model. Combines Xwin and Euryale.
-
-  Credits to
-  - [@chargoddard](https://huggingface.co/chargoddard) for developing the framework used to merge the model - [mergekit](https://github.com/cg123/mergekit).
-  - [@Undi95](https://huggingface.co/Undi95) for helping with the merge ratios.
-
-  #merge
-context_length: 6144
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Llama2
-  instruct_type: airoboros
-pricing:
-  prompt: '0.00001'
-  completion: '0.0000125'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - logit_bias
-  - top_k
-  - min_p
-  - seed
-  - top_a
-model_provider: alpindale
--- a/resources/model-catalogs/alpindale/magnum-72b.yaml
+++ b/resources/model-catalogs/alpindale/magnum-72b.yaml
@@ -1,42 +0,0 @@
-id: alpindale/magnum-72b
-canonical_slug: alpindale/magnum-72b
-hugging_face_id: alpindale/magnum-72b-v1
-name: Magnum 72B
-type: chat
-created: 1720656000
-description: |-
-  From the maker of [Goliath](https://openrouter.ai/models/alpindale/goliath-120b), Magnum 72B is the first in a new family of models designed to achieve the prose quality of the Claude 3 models, notably Opus & Sonnet.
-
-  The model is based on [Qwen2 72B](https://openrouter.ai/models/qwen/qwen-2-72b-instruct) and trained with 55 million tokens of highly curated roleplay (RP) data.
-context_length: 16384
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Qwen
-  instruct_type: chatml
-pricing:
-  prompt: '0.000004'
-  completion: '0.000006'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - top_k
-  - min_p
-  - seed
-model_provider: alpindale
--- a/resources/model-catalogs/amazon/nova-lite-v1.yaml
+++ b/resources/model-catalogs/amazon/nova-lite-v1.yaml
@@ -1,39 +0,0 @@
-id: amazon/nova-lite-v1
-canonical_slug: amazon/nova-lite-v1
-hugging_face_id: ''
-name: 'Amazon: Nova Lite 1.0'
-type: chat
-created: 1733437363
-description: |-
-  Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite can handle real-time customer interactions, document analysis, and visual question-answering tasks with high accuracy.
-
-  With an input context of 300K tokens, it can analyze multiple images or up to 30 minutes of video in a single input.
-context_length: 300000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Nova
-  instruct_type: null
-pricing:
-  prompt: '0.00000006'
-  completion: '0.00000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0.00009'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: amazon
--- a/resources/model-catalogs/amazon/nova-micro-v1.yaml
+++ b/resources/model-catalogs/amazon/nova-micro-v1.yaml
@@ -1,35 +0,0 @@
-id: amazon/nova-micro-v1
-canonical_slug: amazon/nova-micro-v1
-hugging_face_id: ''
-name: 'Amazon: Nova Micro 1.0'
-type: chat
-created: 1733437237
-description: Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost. With a context length of 128K tokens and optimized for speed and cost, Amazon Nova Micro excels at tasks such as text summarization, translation, content classification, interactive chat, and brainstorming. It has  simple mathematical reasoning and coding abilities.
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Nova
-  instruct_type: null
-pricing:
-  prompt: '0.000000035'
-  completion: '0.00000014'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: amazon
--- a/resources/model-catalogs/amazon/nova-pro-v1.yaml
+++ b/resources/model-catalogs/amazon/nova-pro-v1.yaml
@@ -1,41 +0,0 @@
-id: amazon/nova-pro-v1
-canonical_slug: amazon/nova-pro-v1
-hugging_face_id: ''
-name: 'Amazon: Nova Pro 1.0'
-type: chat
-created: 1733436303
-description: |-
-  Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).
-
-  Amazon Nova Pro demonstrates strong capabilities in processing both visual and textual information and at analyzing financial documents.
-
-  **NOTE**: Video input is not supported at this time.
-context_length: 300000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Nova
-  instruct_type: null
-pricing:
-  prompt: '0.0000008'
-  completion: '0.0000032'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0.0012'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: amazon
--- a/resources/model-catalogs/anthracite-org/magnum-v2-72b.yaml
+++ b/resources/model-catalogs/anthracite-org/magnum-v2-72b.yaml
@@ -1,43 +0,0 @@
-id: anthracite-org/magnum-v2-72b
-canonical_slug: anthracite-org/magnum-v2-72b
-hugging_face_id: anthracite-org/magnum-v2-72b
-name: Magnum v2 72B
-type: chat
-created: 1727654400
-description: |-
-  From the maker of [Goliath](https://openrouter.ai/models/alpindale/goliath-120b), Magnum 72B is the seventh in a family of models designed to achieve the prose quality of the Claude 3 models, notably Opus & Sonnet.
-
-  The model is based on [Qwen2 72B](https://openrouter.ai/models/qwen/qwen-2-72b-instruct) and trained with 55 million tokens of highly curated roleplay (RP) data.
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Qwen
-  instruct_type: chatml
-pricing:
-  prompt: '0.000003'
-  completion: '0.000003'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - logit_bias
-  - top_k
-  - min_p
-  - seed
-model_provider: anthracite-org
--- a/resources/model-catalogs/anthracite-org/magnum-v4-72b.yaml
+++ b/resources/model-catalogs/anthracite-org/magnum-v4-72b.yaml
@@ -1,44 +0,0 @@
-id: anthracite-org/magnum-v4-72b
-canonical_slug: anthracite-org/magnum-v4-72b
-hugging_face_id: anthracite-org/magnum-v4-72b
-name: Magnum v4 72B
-type: chat
-created: 1729555200
-description: |-
-  This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and Opus(https://openrouter.ai/anthropic/claude-3-opus).
-
-  The model is fine-tuned on top of [Qwen2.5 72B](https://openrouter.ai/qwen/qwen-2.5-72b-instruct).
-context_length: 16384
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Qwen
-  instruct_type: chatml
-pricing:
-  prompt: '0.0000025'
-  completion: '0.000003'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - repetition_penalty
-  - top_k
-  - min_p
-  - seed
-  - logit_bias
-  - top_a
-model_provider: anthracite-org
--- a/resources/model-catalogs/anthropic/claude-2-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-2-beta.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2:beta
-canonical_slug: anthropic/claude-2
-hugging_face_id: ''
-name: 'Anthropic: Claude v2 (self-moderated)'
-type: chat
-created: 1700611200
-description: 'Claude 2 delivers advancements in key capabilities for enterprises—including an industry-leading 200K token context window, significant reductions in rates of model hallucination, system prompts and a new beta feature: tool use.'
-context_length: 200000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-2.0-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-2.0-beta.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2.0:beta
-canonical_slug: anthropic/claude-2.0
-hugging_face_id: ''
-name: 'Anthropic: Claude v2.0 (self-moderated)'
-type: chat
-created: 1690502400
-description: Anthropic's flagship model. Superior performance on tasks that require complex reasoning. Supports hundreds of pages of text.
-context_length: 100000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-2.0.yaml
+++ b/resources/model-catalogs/anthropic/claude-2.0.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2.0
-canonical_slug: anthropic/claude-2.0
-hugging_face_id: ''
-name: 'Anthropic: Claude v2.0'
-type: chat
-created: 1690502400
-description: Anthropic's flagship model. Superior performance on tasks that require complex reasoning. Supports hundreds of pages of text.
-context_length: 100000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-2.1-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-2.1-beta.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2.1:beta
-canonical_slug: anthropic/claude-2.1
-hugging_face_id: ''
-name: 'Anthropic: Claude v2.1 (self-moderated)'
-type: chat
-created: 1700611200
-description: 'Claude 2 delivers advancements in key capabilities for enterprises—including an industry-leading 200K token context window, significant reductions in rates of model hallucination, system prompts and a new beta feature: tool use.'
-context_length: 200000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-2.1.yaml
+++ b/resources/model-catalogs/anthropic/claude-2.1.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2.1
-canonical_slug: anthropic/claude-2.1
-hugging_face_id: ''
-name: 'Anthropic: Claude v2.1'
-type: chat
-created: 1700611200
-description: 'Claude 2 delivers advancements in key capabilities for enterprises—including an industry-leading 200K token context window, significant reductions in rates of model hallucination, system prompts and a new beta feature: tool use.'
-context_length: 200000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-2.yaml
+++ b/resources/model-catalogs/anthropic/claude-2.yaml
@@ -1,34 +0,0 @@
-id: anthropic/claude-2
-canonical_slug: anthropic/claude-2
-hugging_face_id: ''
-name: 'Anthropic: Claude v2'
-type: chat
-created: 1700611200
-description: 'Claude 2 delivers advancements in key capabilities for enterprises—including an industry-leading 200K token context window, significant reductions in rates of model hallucination, system prompts and a new beta feature: tool use.'
-context_length: 200000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000008'
-  completion: '0.000024'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-haiku-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-haiku-beta.yaml
@@ -1,43 +0,0 @@
-id: anthropic/claude-3-haiku:beta
-canonical_slug: anthropic/claude-3-haiku
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Haiku (self-moderated)'
-type: chat
-created: 1710288000
-description: |-
-  Claude 3 Haiku is Anthropic's fastest and most compact model for
-  near-instant responsiveness. Quick and accurate targeted performance.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-haiku)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.00000025'
-  completion: '0.00000125'
-  input_cache_read: '0.00000003'
-  input_cache_write: '0.0000003'
-  request: '0'
-  image: '0.0004'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-haiku.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-haiku.yaml
@@ -1,43 +0,0 @@
-id: anthropic/claude-3-haiku
-canonical_slug: anthropic/claude-3-haiku
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Haiku'
-type: chat
-created: 1710288000
-description: |-
-  Claude 3 Haiku is Anthropic's fastest and most compact model for
-  near-instant responsiveness. Quick and accurate targeted performance.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-haiku)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.00000025'
-  completion: '0.00000125'
-  input_cache_read: '0.00000003'
-  input_cache_write: '0.0000003'
-  request: '0'
-  image: '0.0004'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-opus-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-opus-beta.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3-opus:beta
-canonical_slug: anthropic/claude-3-opus
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Opus (self-moderated)'
-type: chat
-created: 1709596800
-description: |-
-  Claude 3 Opus is Anthropic's most powerful model for highly complex tasks. It boasts top-level performance, intelligence, fluency, and understanding.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000015'
-  completion: '0.000075'
-  input_cache_read: '0.0000015'
-  input_cache_write: '0.00001875'
-  request: '0'
-  image: '0.024'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-opus.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-opus.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3-opus
-canonical_slug: anthropic/claude-3-opus
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Opus'
-type: chat
-created: 1709596800
-description: |-
-  Claude 3 Opus is Anthropic's most powerful model for highly complex tasks. It boasts top-level performance, intelligence, fluency, and understanding.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000015'
-  completion: '0.000075'
-  input_cache_read: '0.0000015'
-  input_cache_write: '0.00001875'
-  request: '0'
-  image: '0.024'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-sonnet-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-sonnet-beta.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3-sonnet:beta
-canonical_slug: anthropic/claude-3-sonnet
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Sonnet (self-moderated)'
-type: chat
-created: 1709596800
-description: |-
-  Claude 3 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3-sonnet.yaml
+++ b/resources/model-catalogs/anthropic/claude-3-sonnet.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3-sonnet
-canonical_slug: anthropic/claude-3-sonnet
-hugging_face_id: ''
-name: 'Anthropic: Claude 3 Sonnet'
-type: chat
-created: 1709596800
-description: |-
-  Claude 3 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-haiku-20241022-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-haiku-20241022-beta.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3.5-haiku-20241022:beta
-canonical_slug: anthropic/claude-3-5-haiku-20241022
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Haiku (2024-10-22) (self-moderated)'
-type: chat
-created: 1730678400
-description: |-
-  Claude 3.5 Haiku features enhancements across all skill sets including coding, tool use, and reasoning. As the fastest model in the Anthropic lineup, it offers rapid response times suitable for applications that require high interactivity and low latency, such as user-facing chatbots and on-the-fly code completions. It also excels in specialized tasks like data extraction and real-time content moderation, making it a versatile tool for a broad range of industries.
-
-  It does not support image inputs.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/3-5-models-and-computer-use)
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.0000008'
-  completion: '0.000004'
-  input_cache_read: '0.00000008'
-  input_cache_write: '0.000001'
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-haiku-20241022.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-haiku-20241022.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3.5-haiku-20241022
-canonical_slug: anthropic/claude-3-5-haiku-20241022
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Haiku (2024-10-22)'
-type: chat
-created: 1730678400
-description: |-
-  Claude 3.5 Haiku features enhancements across all skill sets including coding, tool use, and reasoning. As the fastest model in the Anthropic lineup, it offers rapid response times suitable for applications that require high interactivity and low latency, such as user-facing chatbots and on-the-fly code completions. It also excels in specialized tasks like data extraction and real-time content moderation, making it a versatile tool for a broad range of industries.
-
-  It does not support image inputs.
-
-  See the launch announcement and benchmark results [here](https://www.anthropic.com/news/3-5-models-and-computer-use)
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.0000008'
-  completion: '0.000004'
-  input_cache_read: '0.00000008'
-  input_cache_write: '0.000001'
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-haiku-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-haiku-beta.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3.5-haiku:beta
-canonical_slug: anthropic/claude-3-5-haiku
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Haiku (self-moderated)'
-type: chat
-created: 1730678400
-description: |-
-  Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use. Engineered to excel in real-time applications, it delivers quick response times that are essential for dynamic tasks such as chat interactions and immediate coding suggestions.
-
-  This makes it highly suitable for environments that demand both speed and precision, such as software development, customer service bots, and data management systems.
-
-  This model is currently pointing to [Claude 3.5 Haiku (2024-10-22)](/anthropic/claude-3-5-haiku-20241022).
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.0000008'
-  completion: '0.000004'
-  input_cache_read: '0.00000008'
-  input_cache_write: '0.000001'
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-haiku.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-haiku.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-3.5-haiku
-canonical_slug: anthropic/claude-3-5-haiku
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Haiku'
-type: chat
-created: 1730678400
-description: |-
-  Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use. Engineered to excel in real-time applications, it delivers quick response times that are essential for dynamic tasks such as chat interactions and immediate coding suggestions.
-
-  This makes it highly suitable for environments that demand both speed and precision, such as software development, customer service bots, and data management systems.
-
-  This model is currently pointing to [Claude 3.5 Haiku (2024-10-22)](/anthropic/claude-3-5-haiku-20241022).
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.0000008'
-  completion: '0.000004'
-  input_cache_read: '0.00000008'
-  input_cache_write: '0.000001'
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-sonnet-20240620-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-sonnet-20240620-beta.yaml
@@ -1,47 +0,0 @@
-id: anthropic/claude-3.5-sonnet-20240620:beta
-canonical_slug: anthropic/claude-3.5-sonnet-20240620
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Sonnet (2024-06-20) (self-moderated)'
-type: chat
-created: 1718841600
-description: |-
-  Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:
-
-  - Coding: Autonomously writes, edits, and runs code with reasoning and troubleshooting
-  - Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights
-  - Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone
-  - Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)
-
-  For the latest version (2024-10-23), check out [Claude 3.5 Sonnet](/anthropic/claude-3.5-sonnet).
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-sonnet-20240620.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-sonnet-20240620.yaml
@@ -1,47 +0,0 @@
-id: anthropic/claude-3.5-sonnet-20240620
-canonical_slug: anthropic/claude-3.5-sonnet-20240620
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Sonnet (2024-06-20)'
-type: chat
-created: 1718841600
-description: |-
-  Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:
-
-  - Coding: Autonomously writes, edits, and runs code with reasoning and troubleshooting
-  - Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights
-  - Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone
-  - Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)
-
-  For the latest version (2024-10-23), check out [Claude 3.5 Sonnet](/anthropic/claude-3.5-sonnet).
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-sonnet-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-sonnet-beta.yaml
@@ -1,45 +0,0 @@
-id: anthropic/claude-3.5-sonnet:beta
-canonical_slug: anthropic/claude-3.5-sonnet
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Sonnet (self-moderated)'
-type: chat
-created: 1729555200
-description: |-
-  New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:
-
-  - Coding: Scores ~49% on SWE-Bench Verified, higher than the last best score, and without any fancy prompt scaffolding
-  - Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights
-  - Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone
-  - Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.5-sonnet.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.5-sonnet.yaml
@@ -1,45 +0,0 @@
-id: anthropic/claude-3.5-sonnet
-canonical_slug: anthropic/claude-3.5-sonnet
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.5 Sonnet'
-type: chat
-created: 1729555200
-description: |-
-  New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:
-
-  - Coding: Scores ~49% on SWE-Bench Verified, higher than the last best score, and without any fancy prompt scaffolding
-  - Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights
-  - Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone
-  - Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)
-
-  #multimodal
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - top_k
-  - stop
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.7-sonnet-beta.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.7-sonnet-beta.yaml
@@ -1,37 +0,0 @@
-id: anthropic/claude-3.7-sonnet:beta
-canonical_slug: anthropic/claude-3-7-sonnet-20250219
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.7 Sonnet (self-moderated)'
-type: chat
-created: 1740422110
-description: "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)"
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.7-sonnet-thinking.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.7-sonnet-thinking.yaml
@@ -1,37 +0,0 @@
-id: anthropic/claude-3.7-sonnet:thinking
-canonical_slug: anthropic/claude-3-7-sonnet-20250219
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.7 Sonnet (thinking)'
-type: chat
-created: 1740422110
-description: "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)"
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-3.7-sonnet.yaml
+++ b/resources/model-catalogs/anthropic/claude-3.7-sonnet.yaml
@@ -1,39 +0,0 @@
-id: anthropic/claude-3.7-sonnet
-canonical_slug: anthropic/claude-3-7-sonnet-20250219
-hugging_face_id: ''
-name: 'Anthropic: Claude 3.7 Sonnet'
-type: chat
-created: 1740422110
-description: "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)"
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-opus-4.yaml
+++ b/resources/model-catalogs/anthropic/claude-opus-4.yaml
@@ -1,39 +0,0 @@
-id: anthropic/claude-opus-4
-canonical_slug: anthropic/claude-4-opus-20250522
-hugging_face_id: ''
-name: 'Anthropic: Claude Opus 4'
-type: chat
-created: 1747931245
-description: "Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows. It sets new benchmarks in software engineering, achieving leading results on SWE-bench (72.5%) and Terminal-bench (43.2%). Opus 4 supports extended, agentic workflows, handling thousands of task steps continuously for hours without degradation. \n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-4)"
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - image
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000015'
-  completion: '0.000075'
-  input_cache_read: '0.0000015'
-  input_cache_write: '0.00001875'
-  request: '0'
-  image: '0.024'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-model_provider: anthropic
--- a/resources/model-catalogs/anthropic/claude-sonnet-4.yaml
+++ b/resources/model-catalogs/anthropic/claude-sonnet-4.yaml
@@ -1,42 +0,0 @@
-id: anthropic/claude-sonnet-4
-canonical_slug: anthropic/claude-4-sonnet-20250522
-hugging_face_id: ''
-name: 'Anthropic: Claude Sonnet 4'
-type: chat
-created: 1747930371
-description: |-
-  Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability. Achieving state-of-the-art performance on SWE-bench (72.7%), Sonnet 4 balances capability and computational efficiency, making it suitable for a broad range of applications from routine coding tasks to complex software development projects. Key enhancements include improved autonomous codebase navigation, reduced error rates in agent-driven workflows, and increased reliability in following intricate instructions. Sonnet 4 is optimized for practical everyday use, providing advanced reasoning capabilities while maintaining efficiency and responsiveness in diverse internal and external scenarios.
-
-  Read more at the [blog post here](https://www.anthropic.com/news/claude-4)
-context_length: 200000
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - image
-    - text
-  output_modalities:
-    - text
-  tokenizer: Claude
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: '0.0000003'
-  input_cache_write: '0.00000375'
-  request: '0'
-  image: '0.0048'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-model_provider: anthropic
--- a/resources/model-catalogs/arcee-ai/arcee-blitz.yaml
+++ b/resources/model-catalogs/arcee-ai/arcee-blitz.yaml
@@ -1,40 +0,0 @@
-id: arcee-ai/arcee-blitz
-canonical_slug: arcee-ai/arcee-blitz
-hugging_face_id: arcee-ai/arcee-blitz
-name: 'Arcee AI: Arcee Blitz'
-type: chat
-created: 1746470100
-description: 'Arcee Blitz is a 24 B‑parameter dense model distilled from DeepSeek and built on Mistral architecture for "everyday" chat. The distillation‑plus‑refinement pipeline trims compute while keeping DeepSeek‑style reasoning, so Blitz punches above its weight on MMLU, GSM‑8K and BBH compared with other mid‑size open models. With a default 128 k context window and competitive throughput, it serves as a cost‑efficient workhorse for summarization, brainstorming and light code help. Internally, Arcee uses Blitz as the default writer in Conductor pipelines when the heavier Virtuoso line is not required. Users therefore get near‑70 B quality at ~⅓ the latency and price. '
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.00000045'
-  completion: '0.00000075'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/caller-large.yaml
+++ b/resources/model-catalogs/arcee-ai/caller-large.yaml
@@ -1,42 +0,0 @@
-id: arcee-ai/caller-large
-canonical_slug: arcee-ai/caller-large
-hugging_face_id: ''
-name: 'Arcee AI: Caller Large'
-type: chat
-created: 1746487869
-description: 'Caller Large is Arcee''s specialist "function‑calling" SLM built to orchestrate external tools and APIs. Instead of maximizing next‑token accuracy, training focuses on structured JSON outputs, parameter extraction and multi‑step tool chains, making Caller a natural choice for retrieval‑augmented generation, robotic process automation or data‑pull chatbots. It incorporates a routing head that decides when (and how) to invoke a tool versus answering directly, reducing hallucinated calls. The model is already the backbone of Arcee Conductor''s auto‑tool mode, where it parses user intent, emits clean function signatures and hands control back once the tool response is ready. Developers thus gain an OpenAI‑style function‑calling UX without handing requests to a frontier‑scale model. '
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.00000055'
-  completion: '0.00000085'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/coder-large.yaml
+++ b/resources/model-catalogs/arcee-ai/coder-large.yaml
@@ -1,40 +0,0 @@
-id: arcee-ai/coder-large
-canonical_slug: arcee-ai/coder-large
-hugging_face_id: ''
-name: 'Arcee AI: Coder Large'
-type: chat
-created: 1746478663
-description: 'Coder‑Large is a 32 B‑parameter offspring of Qwen 2.5‑Instruct that has been further trained on permissively‑licensed GitHub, CodeSearchNet and synthetic bug‑fix corpora. It supports a 32k context window, enabling multi‑file refactoring or long diff review in a single call, and understands 30‑plus programming languages with special attention to TypeScript, Go and Terraform. Internal benchmarks show 5–8 pt gains over CodeLlama‑34 B‑Python on HumanEval and competitive BugFix scores thanks to a reinforcement pass that rewards compilable output. The model emits structured explanations alongside code blocks by default, making it suitable for educational tooling as well as production copilot scenarios. Cost‑wise, Together AI prices it well below proprietary incumbents, so teams can scale interactive coding without runaway spend. '
-context_length: 32768
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000005'
-  completion: '0.0000008'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/maestro-reasoning.yaml
+++ b/resources/model-catalogs/arcee-ai/maestro-reasoning.yaml
@@ -1,40 +0,0 @@
-id: arcee-ai/maestro-reasoning
-canonical_slug: arcee-ai/maestro-reasoning
-hugging_face_id: ''
-name: 'Arcee AI: Maestro Reasoning'
-type: chat
-created: 1746481269
-description: 'Maestro Reasoning is Arcee''s flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic. Compared to the earlier 7 B preview, the production 32 B release widens the context window to 128 k tokens and doubles pass‑rate on MATH and GSM‑8K, while also lifting code completion accuracy. Its instruction style encourages structured "thought → answer" traces that can be parsed or hidden according to user preference. That transparency pairs well with audit‑focused industries like finance or healthcare where seeing the reasoning path matters. In Arcee Conductor, Maestro is automatically selected for complex, multi‑constraint queries that smaller SLMs bounce. '
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000009'
-  completion: '0.0000033'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/spotlight.yaml
+++ b/resources/model-catalogs/arcee-ai/spotlight.yaml
@@ -1,41 +0,0 @@
-id: arcee-ai/spotlight
-canonical_slug: arcee-ai/spotlight
-hugging_face_id: ''
-name: 'Arcee AI: Spotlight'
-type: chat
-created: 1746481552
-description: 'Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks. It offers a 32 k‑token context window, enabling rich multimodal conversations that combine lengthy documents with one or more images. Training emphasized fast inference on consumer GPUs while retaining strong captioning, visual‐question‑answering, and diagram‑analysis accuracy. As a result, Spotlight slots neatly into agent workflows where screenshots, charts or UI mock‑ups need to be interpreted on the fly. Early benchmarks show it matching or out‑scoring larger VLMs such as LLaVA‑1.6 13 B on popular VQA and POPE alignment tests. '
-context_length: 131072
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - image
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.00000018'
-  completion: '0.00000018'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/virtuoso-large.yaml
+++ b/resources/model-catalogs/arcee-ai/virtuoso-large.yaml
@@ -1,42 +0,0 @@
-id: arcee-ai/virtuoso-large
-canonical_slug: arcee-ai/virtuoso-large
-hugging_face_id: ''
-name: 'Arcee AI: Virtuoso Large'
-type: chat
-created: 1746478885
-description: Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA. Unlike many 70 B peers, it retains the 128 k context inherited from Qwen 2.5, letting it ingest books, codebases or financial filings wholesale. Training blended DeepSeek R1 distillation, multi‑epoch supervised fine‑tuning and a final DPO/RLHF alignment stage, yielding strong performance on BIG‑Bench‑Hard, GSM‑8K and long‑context Needle‑In‑Haystack tests. Enterprises use Virtuoso‑Large as the "fallback" brain in Conductor pipelines when other SLMs flag low confidence. Despite its size, aggressive KV‑cache optimizations keep first‑token latency in the low‑second range on 8× H100 nodes, making it a practical production‑grade powerhouse.
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.00000075'
-  completion: '0.0000012'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/arcee-ai/virtuoso-medium-v2.yaml
+++ b/resources/model-catalogs/arcee-ai/virtuoso-medium-v2.yaml
@@ -1,42 +0,0 @@
-id: arcee-ai/virtuoso-medium-v2
-canonical_slug: arcee-ai/virtuoso-medium-v2
-hugging_face_id: arcee-ai/Virtuoso-Medium-v2
-name: 'Arcee AI: Virtuoso Medium V2'
-type: chat
-created: 1746478434
-description: 'Virtuoso‑Medium‑v2 is a 32 B model distilled from DeepSeek‑v3 logits and merged back onto a Qwen 2.5 backbone, yielding a sharper, more factual successor to the original Virtuoso Medium. The team harvested ~1.1 B logit tokens and applied "fusion‑merging" plus DPO alignment, which pushed scores past Arcee‑Nova 2024 and many 40 B‑plus peers on MMLU‑Pro, MATH and HumanEval. With a 128 k context and aggressive quantization options (from BF16 down to 4‑bit GGUF), it balances capability with deployability on single‑GPU nodes. Typical use cases include enterprise chat assistants, technical writing aids and medium‑complexity code drafting where Virtuoso‑Large would be overkill. '
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000005'
-  completion: '0.0000008'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - min_p
-  - response_format
-model_provider: arcee-ai
--- a/resources/model-catalogs/bytedance/doubao-embedding-large-text-240715.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-large-text-240715.yaml
@@ -1,24 +0,0 @@
-id: bytedance/doubao-embedding-text-240715
-canonical_slug: bytedance/doubao-embedding-text-240715
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding Text (240715)'
-description: |-
-  Doubao Embedding Large 是字节跳动语义向量化模型的最新升级版，模型以豆包语言模型为基座，具备强大的语言理解能力；主要面向向量检索的使用场景，支持中、英双语。
-context_length: 4000
-dimensions:
-  - 512
-  - 1024
-  - 2048
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.7'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-embedding-large-text-240915.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-large-text-240915.yaml
@@ -1,25 +0,0 @@
-id: bytedance/doubao-embedding-large-text-240915
-canonical_slug: bytedance/doubao-embedding-large-text-240915
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding Large Text (240915)'
-description: |-
-  Doubao Embedding Large 是字节跳动语义向量化模型的最新升级版，模型以豆包语言模型为基座，具备强大的语言理解能力；主要面向向量检索的使用场景，支持中、英双语。
-context_length: 4000
-dimensions:
-  - 512
-  - 1024
-  - 2048
-  - 4096
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.7'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-embedding-text-240515.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-text-240515.yaml
@@ -1,24 +0,0 @@
-id: bytedance/doubao-embedding-text-240715
-canonical_slug: bytedance/doubao-embedding-text-240715
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding'
-description: |-
-  由字节跳动研发的语义向量化模型，主要面向向量检索的使用场景，支持中、英双语，最长 4K 上下文长度。向量维度 2048 维，支持 512、1024 降维使用。
-context_length: 4000
-dimensions:
-  - 512
-  - 1024
-  - 2048
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.5'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-embedding-text-240715.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-text-240715.yaml
@@ -1,25 +0,0 @@
-id: bytedance/doubao-embedding-text-240715
-canonical_slug: bytedance/doubao-embedding-text-240715
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding'
-description: |-
-  由字节跳动研发的语义向量化模型，主要面向向量检索的使用场景，支持中、英双语，最长 4K 上下文长度。向量维度 2048 维，支持 512、1024 降维使用。
-context_length: 4000
-dimensions:
-  - 512
-  - 1024
-  - 2048
-  - 2560
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.5'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-embedding-vision-241215.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-vision-241215.yaml
@@ -1,24 +0,0 @@
-id: bytedance/doubao-embedding-vision-241215
-canonical_slug: bytedance/doubao-embedding-vision-241215
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding Vision'
-description: |-
-  Doubao-embedding-vision，全新升级图文多模态向量化模型，主要面向图文多模向量检索的使用场景，支持图片输入及中、英双语文本输入，最长 8K 上下文长度。
-context_length: 8000
-dimensions:
-  - 3072
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.7'
-  prompt_image: '1.8'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-embedding-vision-250328.yaml
+++ b/resources/model-catalogs/bytedance/doubao-embedding-vision-250328.yaml
@@ -1,25 +0,0 @@
-id: bytedance/doubao-embedding-vision-250328
-canonical_slug: bytedance/doubao-embedding-vision-250328
-type: embedding
-hugging_face_id: null
-name: 'ByteDance: Doubao Embedding Vision'
-description: |-
-  Doubao-embedding-vision，全新升级图文多模态向量化模型，主要面向图文多模向量检索的使用场景，支持图片输入及中、英双语文本输入，最长 8K 上下文长度。
-context_length: 8000
-dimensions:
-  - 1024
-  - 2048
-architecture:
-  modality: text+image->text
-  input_modalities:
-    - text
-    - image
-  output_modalities:
-    - text
-  tokenizer: Doubao
-pricing:
-  prompt: '0.7'
-  prompt_image: '1.8'
-  unit: 1000000
-  currency: CNY
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-seed-1.6-flash.yaml
+++ b/resources/model-catalogs/bytedance/doubao-seed-1.6-flash.yaml
@@ -1,41 +0,0 @@
-id: bytedance/doubao-seed-1.6-flash
-canonical_slug: bytedance/doubao-seed-1.6-flash
-type: chat
-hugging_face_id: ''
-name: 'ByteDance: Doubao Seed 1.6 Flash'
-created: 1738402289
-description: 有极致推理速度的多模态深度思考模型；同时支持文本和视觉理解。文本理解能力超过上一代 Lite 系列模型，视觉理解比肩友商 Pro 系列模型。
-context_length: 256000
-architecture:
-  modality: text+image+vedio->text
-  input_modalities:
-    - text
-    - image
-    - video
-  output_modalities:
-    - text
-  tokenizer: Doubao
-  instruct_type: null
-pricing:
-  prompt: '0.15'
-  completion: '1.5'
-  input_cache_read: '0.03'
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  currency: CNY
-  unit: 1000000
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-  - structured_outputs
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-seed-1.6-thinking.yaml
+++ b/resources/model-catalogs/bytedance/doubao-seed-1.6-thinking.yaml
@@ -1,41 +0,0 @@
-id: bytedance/doubao-seed-1.6-thinking
-canonical_slug: bytedance/doubao-seed-1.6-thinking
-type: chat
-hugging_face_id: ''
-name: 'ByteDance: Doubao Seed 1.6 Thinking'
-created: 1738402289
-description: 在思考能力上进行了大幅强化， 对比 doubao 1.5 代深度理解模型，在编程、数学、逻辑推理等基础能力上进一步提升， 支持视觉理解。
-context_length: 256000
-architecture:
-  modality: text+image+vedio->text
-  input_modalities:
-    - text
-    - image
-    - video
-  output_modalities:
-    - text
-  tokenizer: Doubao
-  instruct_type: null
-pricing:
-  prompt: '0.8'
-  completion: '8.0'
-  input_cache_read: '0.16'
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  currency: CNY
-  unit: 1000000
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-  - structured_outputs
-model_provider: bytedance
--- a/resources/model-catalogs/bytedance/doubao-seed-1.6.yaml
+++ b/resources/model-catalogs/bytedance/doubao-seed-1.6.yaml
@@ -1,41 +0,0 @@
-id: bytedance/doubao-seed-1.6
-canonical_slug: bytedance/doubao-seed-1.6
-type: chat
-hugging_face_id: ''
-name: 'ByteDance: Doubao Seed 1.6'
-created: 1738402289
-description: 全新多模态深度思考模型，同时支持 thinking、non-thinking、auto三种思考模式。其中 non-thinking 模型对比 doubao-1.5-pro-32k-250115 模型大幅提升。
-context_length: 256000
-architecture:
-  modality: text+image+vedio->text
-  input_modalities:
-    - text
-    - image
-    - video
-  output_modalities:
-    - text
-  tokenizer: Doubao
-  instruct_type: null
-pricing:
-  prompt: '0.8'
-  completion: '8.0'
-  input_cache_read: '0.16'
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  currency: CNY
-  unit: 1000000
-supported_parameters:
-  - max_tokens
-  - temperature
-  - stop
-  - reasoning
-  - include_reasoning
-  - tools
-  - tool_choice
-  - top_p
-  - top_k
-  - structured_outputs
-model_provider: bytedance
--- a/resources/model-catalogs/cognitivecomputations/dolphin-mixtral-8x22b.yaml
+++ b/resources/model-catalogs/cognitivecomputations/dolphin-mixtral-8x22b.yaml
@@ -1,47 +0,0 @@
-id: cognitivecomputations/dolphin-mixtral-8x22b
-canonical_slug: cognitivecomputations/dolphin-mixtral-8x22b
-hugging_face_id: cognitivecomputations/dolphin-2.9.2-mixtral-8x22b
-name: "Dolphin 2.9.2 Mixtral 8x22B \U0001F42C"
-type: chat
-created: 1717804800
-description: |-
-  Dolphin 2.9 is designed for instruction following, conversational, and coding. This model is a finetune of [Mixtral 8x22B Instruct](/models/mistralai/mixtral-8x22b-instruct). It features a 64k context length and was fine-tuned with a 16k sequence length using ChatML templates.
-
-  This model is a successor to [Dolphin Mixtral 8x7B](/models/cognitivecomputations/dolphin-mixtral-8x7b).
-
-  The model is uncensored and is stripped of alignment and bias. It requires an external alignment layer for ethical use. Users are cautioned to use this highly compliant model responsibly, as detailed in a blog post about uncensored models at [erichartford.com/uncensored-models](https://erichartford.com/uncensored-models).
-
-  #moe #uncensored
-context_length: 16000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Mistral
-  instruct_type: chatml
-pricing:
-  prompt: '0.0000009'
-  completion: '0.0000009'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - seed
-  - top_k
-  - min_p
-  - repetition_penalty
-  - logit_bias
-model_provider: cognitivecomputations
--- a/resources/model-catalogs/cohere/command-a.yaml
+++ b/resources/model-catalogs/cohere/command-a.yaml
@@ -1,41 +0,0 @@
-id: cohere/command-a
-canonical_slug: cohere/command-a-03-2025
-hugging_face_id: CohereForAI/c4ai-command-a-03-2025
-name: 'Cohere: Command A'
-type: chat
-created: 1741894342
-description: |-
-  Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases.
-  Compared to other leading proprietary and open-weights models Command A delivers maximum performance with minimum hardware costs, excelling on business-critical agentic and multilingual tasks.
-context_length: 256000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Other
-  instruct_type: null
-pricing:
-  prompt: '0.0000025'
-  completion: '0.00001'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r-03-2024.yaml
+++ b/resources/model-catalogs/cohere/command-r-03-2024.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r-03-2024
-canonical_slug: cohere/command-r-03-2024
-hugging_face_id: ''
-name: 'Cohere: Command R (03-2024)'
-type: chat
-created: 1709341200
-description: |-
-  Command-R is a 35B parameter model that performs conversational language tasks at a higher quality, more reliably, and with a longer context than previous models. It can be used for complex workflows like code generation, retrieval augmented generation (RAG), tool use, and agents.
-
-  Read the launch post [here](https://txt.cohere.com/command-r/).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.0000005'
-  completion: '0.0000015'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r-08-2024.yaml
+++ b/resources/model-catalogs/cohere/command-r-08-2024.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r-08-2024
-canonical_slug: cohere/command-r-08-2024
-hugging_face_id: ''
-name: 'Cohere: Command R (08-2024)'
-type: chat
-created: 1724976000
-description: |-
-  command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool use. More broadly, it is better at math, code and reasoning and is competitive with the previous version of the larger Command R+ model.
-
-  Read the launch post [here](https://docs.cohere.com/changelog/command-gets-refreshed).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.00000015'
-  completion: '0.0000006'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r-plus-04-2024.yaml
+++ b/resources/model-catalogs/cohere/command-r-plus-04-2024.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r-plus-04-2024
-canonical_slug: cohere/command-r-plus-04-2024
-hugging_face_id: ''
-name: 'Cohere: Command R+ (04-2024)'
-type: chat
-created: 1712016000
-description: |-
-  Command R+ is a new, 104B-parameter LLM from Cohere. It's useful for roleplay, general consumer usecases, and Retrieval Augmented Generation (RAG).
-
-  It offers multilingual support for ten key languages to facilitate global business operations. See benchmarks and the launch post [here](https://txt.cohere.com/command-r-plus-microsoft-azure/).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r-plus-08-2024.yaml
+++ b/resources/model-catalogs/cohere/command-r-plus-08-2024.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r-plus-08-2024
-canonical_slug: cohere/command-r-plus-08-2024
-hugging_face_id: ''
-name: 'Cohere: Command R+ (08-2024)'
-type: chat
-created: 1724976000
-description: |-
-  command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while keeping the hardware footprint the same.
-
-  Read the launch post [here](https://docs.cohere.com/changelog/command-gets-refreshed).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.0000025'
-  completion: '0.00001'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r-plus.yaml
+++ b/resources/model-catalogs/cohere/command-r-plus.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r-plus
-canonical_slug: cohere/command-r-plus
-hugging_face_id: ''
-name: 'Cohere: Command R+'
-type: chat
-created: 1712188800
-description: |-
-  Command R+ is a new, 104B-parameter LLM from Cohere. It's useful for roleplay, general consumer usecases, and Retrieval Augmented Generation (RAG).
-
-  It offers multilingual support for ten key languages to facilitate global business operations. See benchmarks and the launch post [here](https://txt.cohere.com/command-r-plus-microsoft-azure/).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.000003'
-  completion: '0.000015'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r.yaml
+++ b/resources/model-catalogs/cohere/command-r.yaml
@@ -1,45 +0,0 @@
-id: cohere/command-r
-canonical_slug: cohere/command-r
-hugging_face_id: ''
-name: 'Cohere: Command R'
-type: chat
-created: 1710374400
-description: |-
-  Command-R is a 35B parameter model that performs conversational language tasks at a higher quality, more reliably, and with a longer context than previous models. It can be used for complex workflows like code generation, retrieval augmented generation (RAG), tool use, and agents.
-
-  Read the launch post [here](https://txt.cohere.com/command-r/).
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.0000005'
-  completion: '0.0000015'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command-r7b-12-2024.yaml
+++ b/resources/model-catalogs/cohere/command-r7b-12-2024.yaml
@@ -1,42 +0,0 @@
-id: cohere/command-r7b-12-2024
-canonical_slug: cohere/command-r7b-12-2024
-hugging_face_id: ''
-name: 'Cohere: Command R7B (12-2024)'
-type: chat
-created: 1734158152
-description: |-
-  Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024. It excels at RAG, tool use, agents, and similar tasks requiring complex reasoning and multiple steps.
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 128000
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.0000000375'
-  completion: '0.00000015'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/cohere/command.yaml
+++ b/resources/model-catalogs/cohere/command.yaml
@@ -1,42 +0,0 @@
-id: cohere/command
-canonical_slug: cohere/command
-hugging_face_id: ''
-name: 'Cohere: Command'
-type: chat
-created: 1710374400
-description: |-
-  Command is an instruction-following conversational model that performs language tasks with high quality, more reliably and with a longer context than our base generative models.
-
-  Use of this model is subject to Cohere's [Usage Policy](https://docs.cohere.com/docs/usage-policy) and [SaaS Agreement](https://cohere.com/saas-agreement).
-context_length: 4096
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: Cohere
-  instruct_type: null
-pricing:
-  prompt: '0.000001'
-  completion: '0.000002'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - seed
-  - response_format
-  - structured_outputs
-model_provider: cohere
--- a/resources/model-catalogs/deepseek/deepseek-chat-v3-0324.yaml
+++ b/resources/model-catalogs/deepseek/deepseek-chat-v3-0324.yaml
@@ -1,49 +0,0 @@
-id: deepseek/deepseek-chat-v3-0324
-canonical_slug: deepseek/deepseek-chat-v3-0324
-hugging_face_id: deepseek-ai/DeepSeek-V3-0324
-name: 'DeepSeek: DeepSeek V3 0324'
-type: chat
-created: 1742824755
-description: |-
-  DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.
-
-  It succeeds the [DeepSeek V3](/deepseek/deepseek-chat-v3) model and performs really well on a variety of tasks.
-context_length: 163840
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: DeepSeek
-  instruct_type: null
-pricing:
-  prompt: '0.0000003'
-  completion: '0.00000088'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - structured_outputs
-  - response_format
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - logprobs
-  - top_logprobs
-  - seed
-  - min_p
-model_provider: deepseek
--- a/resources/model-catalogs/deepseek/deepseek-chat.yaml
+++ b/resources/model-catalogs/deepseek/deepseek-chat.yaml
@@ -1,49 +0,0 @@
-id: deepseek/deepseek-chat
-canonical_slug: deepseek/deepseek-chat-v3
-hugging_face_id: deepseek-ai/DeepSeek-V3
-name: 'DeepSeek: DeepSeek V3'
-type: chat
-created: 1735241320
-description: |-
-  DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations reveal that the model outperforms other open-source models and rivals leading closed-source models.
-
-  For model details, please visit [the DeepSeek-V3 repo](https://github.com/deepseek-ai/DeepSeek-V3) for more information, or see the [launch announcement](https://api-docs.deepseek.com/news/news1226).
-context_length: 163840
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: DeepSeek
-  instruct_type: null
-pricing:
-  prompt: '0.00000038'
-  completion: '0.00000089'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - tools
-  - tool_choice
-  - max_tokens
-  - temperature
-  - top_p
-  - structured_outputs
-  - response_format
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - top_k
-  - repetition_penalty
-  - logit_bias
-  - logprobs
-  - top_logprobs
-  - seed
-  - min_p
-model_provider: deepseek
--- a/resources/model-catalogs/deepseek/deepseek-prover-v2.yaml
+++ b/resources/model-catalogs/deepseek/deepseek-prover-v2.yaml
@@ -1,41 +0,0 @@
-id: deepseek/deepseek-prover-v2
-canonical_slug: deepseek/deepseek-prover-v2
-hugging_face_id: deepseek-ai/DeepSeek-Prover-V2-671B
-name: 'DeepSeek: DeepSeek Prover V2'
-type: chat
-created: 1746013094
-description: DeepSeek Prover V2 is a 671B parameter model, speculated to be geared towards logic and mathematics. Likely an upgrade from [DeepSeek-Prover-V1.5](https://huggingface.co/deepseek-ai/DeepSeek-Prover-V1.5-RL) Not much is known about the model yet, as DeepSeek released it on Hugging Face without an announcement or description.
-context_length: 131072
-architecture:
-  modality: text->text
-  input_modalities:
-    - text
-  output_modalities:
-    - text
-  tokenizer: DeepSeek
-  instruct_type: null
-pricing:
-  prompt: '0.0000005'
-  completion: '0.00000218'
-  input_cache_read: ''
-  input_cache_write: ''
-  request: '0'
-  image: '0'
-  web_search: '0'
-  internal_reasoning: '0'
-  unit: 1
-  currency: USD
-supported_parameters:
-  - max_tokens
-  - temperature
-  - top_p
-  - stop
-  - frequency_penalty
-  - presence_penalty
-  - seed
-  - top_k
-  - min_p
-  - repetition_penalty
-  - logit_bias
-  - response_format
-model_provider: deepseek
--- a/Show More
+++ b/Show More