fix build electron in ci

build the desktop framework
update tsconfig
2026-06-15 04:00:09 +00:00 · 2025-04-02 20:55:25 +08:00 · 2025-04-02 19:14:55 +08:00 · 2025-04-02 17:22:40 +08:00 · 2025-04-02 16:55:48 +08:00 · 2025-04-02 16:27:34 +08:00
714 changed files with 44880 additions and 10200 deletions
@@ -1,6 +1,6 @@
 {
-  "image": "mcr.microsoft.com/devcontainers/universal:2",
+  "image": "mcr.microsoft.com/devcontainers/typescript-node",
  "features": {
-    "ghcr.io/devcontainers/features/node:1": {}
+    "ghcr.io/devcontainer-community/devcontainer-features/bun.sh:1": {}
  }
 }
@@ -131,6 +131,10 @@ OPENAI_API_KEY=sk-xxxxxxxxx

 # PPIO_API_KEY=sk-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx

+### INFINI-AI ###
+
+# INFINIAI_API_KEY=sk-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx
+
 ########################################
 ############ Market Service ############
 ########################################
@@ -1,7 +1,7 @@
 name: '🐛 Bug Report'
 description: 'Report an bug'
-title: '[Bug] '
-labels: ['🐛 Bug']
+labels: ['unconfirm']
+type: Bug
 body:
  - type: dropdown
    attributes:
@@ -9,6 +9,7 @@ body:
      multiple: true
      options:
        - 'Official Preview'
+        - 'Official Cloud'
        - 'Vercel'
        - 'Zeabur'
        - 'Sealos'
@@ -1,7 +1,6 @@
 name: '🐛 反馈缺陷'
 description: '反馈一个问题缺陷'
-title: '[Bug] '
-labels: ['🐛 Bug']
+labels: ['unconfirm']
 type: Bug
 body:
  - type: markdown
@@ -17,6 +16,7 @@ body:
      multiple: true
      options:
        - 'Official Preview'
+        - 'Official Cloud'
        - 'Vercel'
        - 'Zeabur'
        - 'Sealos'
@@ -1,7 +1,7 @@
 name: '🌠 Feature Request'
 description: 'Suggest an idea'
 title: '[Request] '
-labels: ['🌠 Feature Request']
+type: Feature
 body:
  - type: textarea
    attributes:
@@ -1,7 +1,7 @@
 name: '🌠 功能需求'
 description: '提出需求或建议'
 title: '[Request] '
-labels: ['🌠 Feature Request']
+type: Feature
 body:
  - type: textarea
    attributes:
@@ -0,0 +1,260 @@
+name: Release Desktop
+
+on:
+  workflow_dispatch: # 手动触发构建
+  release:
+    types: [published] # 发布 release 时触发构建
+  pull_request:
+    types: [synchronize, labeled, unlabeled] # PR 更新或标签变化时触发
+
+# 确保同一时间只运行一个相同的 workflow，取消正在进行的旧的运行
+concurrency:
+  group: ${{ github.ref }}-${{ github.workflow }}
+  cancel-in-progress: true
+
+env:
+  PR_TAG_PREFIX: pr- # PR 构建版本的前缀标识
+
+jobs:
+  test:
+    name: Code quality check
+    # 添加 PR label 触发条件，只有添加了 Build Desktop 标签的 PR 才会触发构建
+    if: |
+      (github.event_name == 'pull_request' &&
+       contains(github.event.pull_request.labels.*.name, 'Build Desktop')) ||
+      github.event_name != 'pull_request'
+    runs-on: ubuntu-latest # 只在 ubuntu 上运行一次检查
+    steps:
+      - name: Checkout base
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - name: Setup Node.js
+        uses: actions/setup-node@v4
+        with:
+          node-version: 22
+
+      - name: Setup pnpm
+        uses: pnpm/action-setup@v2
+        with:
+          version: 8
+
+      - name: Install deps
+        run: pnpm install
+        env:
+          NODE_OPTIONS: --max-old-space-size=6144
+
+      - name: Lint
+        run: pnpm run lint
+        env:
+          NODE_OPTIONS: --max-old-space-size=6144
+
+  #      - name: Test
+  #        run: pnpm run test
+
+  version:
+    name: Determine version
+    # 与 test job 相同的触发条件
+    if: |
+      (github.event_name == 'pull_request' &&
+       contains(github.event.pull_request.labels.*.name, 'Build Desktop')) ||
+      github.event_name != 'pull_request'
+    runs-on: ubuntu-latest
+    outputs:
+      # 输出版本信息，供后续 job 使用
+      version: ${{ steps.set_version.outputs.version }}
+      is_pr_build: ${{ steps.set_version.outputs.is_pr_build }}
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - name: Setup Node.js
+        uses: actions/setup-node@v4
+        with:
+          node-version: 22
+
+      # 主要逻辑：确定构建版本号
+      - name: Set version
+        id: set_version
+        run: |
+          # 从 apps/desktop/package.json 读取基础版本号
+          base_version=$(node -p "require('./apps/desktop/package.json').version")
+
+          if [ "${{ github.event_name }}" == "pull_request" ]; then
+            # PR 构建：在基础版本号上添加 PR 信息
+            branch_name="${{ github.head_ref }}"
+            # 清理分支名，移除非法字符
+            sanitized_branch=$(echo "${branch_name}" | sed -E 's/[^a-zA-Z0-9_.-]+/-/g')
+            # 创建特殊的 PR 版本号：基础版本号-PR前缀-分支名-提交哈希
+            version="${base_version}-${{ env.PR_TAG_PREFIX }}${sanitized_branch}-$(git rev-parse --short HEAD)"
+            echo "version=${version}" >> $GITHUB_OUTPUT
+            echo "is_pr_build=true" >> $GITHUB_OUTPUT
+            echo "📦 Release Version: ${version} (based on base version ${base_version})"
+
+          elif [ "${{ github.event_name }}" == "release" ]; then
+            # Release 事件直接使用 release tag 作为版本号，去掉可能的 v 前缀
+            version="${{ github.event.release.tag_name }}"
+            version="${version#v}"
+            echo "version=${version}" >> $GITHUB_OUTPUT
+            echo "is_pr_build=false" >> $GITHUB_OUTPUT
+            echo "📦 Release Version: ${version}"
+
+          else
+            # 其他情况（如手动触发）使用 apps/desktop/package.json 的版本号
+            version="${base_version}"
+            echo "version=${version}" >> $GITHUB_OUTPUT
+            echo "is_pr_build=false" >> $GITHUB_OUTPUT
+            echo "📦 Release Version: ${version}"
+          fi
+        env:
+          NODE_OPTIONS: --max-old-space-size=6144
+
+      # 输出版本信息总结，方便在 GitHub Actions 界面查看
+      - name: Version Summary
+        run: |
+          echo "🚦 Release Version: ${{ steps.set_version.outputs.version }}"
+          echo "🔄 Is PR Build: ${{ steps.set_version.outputs.is_pr_build }}"
+
+  build:
+    needs: [version, test]
+    name: Build Desktop App
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix:
+        os: [macos-latest, windows-latest]
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - name: Setup Node.js
+        uses: actions/setup-node@v4
+        with:
+          node-version: 22
+
+      - name: Setup pnpm
+        uses: pnpm/action-setup@v2
+        with:
+          version: 8
+
+      - name: Install deps
+        run: pnpm install
+
+      - name: Install deps on Desktop
+        run: npm run install-isolated --prefix=./apps/desktop
+
+      # 设置 package.json 的版本号
+      - name: Set package version
+        run: npm run workflow:set-desktop-version ${{ needs.version.outputs.version }}
+
+      # macOS 构建处理
+      - name: Build artifact on macOS
+        if: runner.os == 'macOS'
+        run: npm run desktop:build
+        env:
+          APP_URL: http://localhost:3010
+          DATABASE_URL: 'postgresql://postgres@localhost:5432/postgres'
+          # 默认添加一个加密 SECRET
+          KEY_VAULTS_SECRET: 'oLXWIiR/AKF+rWaqy9lHkrYgzpATbW3CtJp3UfkVgpE='
+        # 公证部分将来再加回
+        #   CSC_LINK: ./build/developer-id-app-certs.p12
+        #   CSC_KEY_PASSWORD: ${{ secrets.APPLE_APP_CERTS_PASSWORD }}
+        #   APPLE_ID: ${{ secrets.APPLE_ID }}
+        #   APPLE_ID_PASSWORD: ${{ secrets.APPLE_ID_PASSWORD }}
+
+      # 非 macOS 平台构建处理
+      - name: Build artifact on other platforms
+        if: runner.os != 'macOS'
+        run: npm run desktop:build
+        env:
+          APP_URL: http://localhost:3010
+          DATABASE_URL: 'postgresql://postgres@localhost:5432/postgres'
+          KEY_VAULTS_SECRET: 'oLXWIiR/AKF+rWaqy9lHkrYgzpATbW3CtJp3UfkVgpE='
+
+      # 上传构建产物，移除了 zip 相关部分
+      - name: Upload artifact
+        uses: actions/upload-artifact@v4
+        with:
+          name: release-${{ matrix.os }}
+          path: |
+            apps/desktop/release/latest*
+            apps/desktop/release/lobehub*.dmg*
+            apps/desktop/release/lobehub*.exe*
+            apps/desktop/release/lobehub*.AppImage
+          retention-days: 5
+          echo "🔄 Is PR Build: ${{ needs.version.outputs.is_pr_build }}"
+
+  merge:
+    needs: [build, version]
+    name: Merge Artifacts
+    runs-on: ubuntu-latest
+    steps:
+      # 下载所有平台的构建产物
+      - name: Download artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: release
+          pattern: release-*
+          merge-multiple: true
+
+      # 列出所有构建产物
+      - name: List artifacts
+        run: ls -R release
+
+  publish:
+    # 只有非 PR 构建且没有 [skip ci] 标记的提交才执行发布
+    if: |
+      needs.version.outputs.is_pr_build != 'true' &&
+      !contains(github.event.head_commit.message, '[skip ci]')
+    needs: [merge, version]
+    name: Publish Release
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      # 下载构建产物
+      - name: Download artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: release
+          pattern: release-*
+          merge-multiple: true
+
+      # 列出所有构建产物
+      - name: List artifacts
+        run: ls -R release
+
+      # 对于非 release 触发的构建，创建为 draft 状态的 GitHub Release
+      - name: Create Draft Release
+        if: github.event_name != 'release'
+        uses: softprops/action-gh-release@v1
+        with:
+          name: Desktop v${{ needs.version.outputs.version }}
+          tag_name: v${{ needs.version.outputs.version }}
+          draft: true # A draft release
+          prerelease: false
+          files: |
+            release/latest*
+            release/umi*.dmg*
+            release/umi*.exe*
+            release/umi*.AppImage
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+
+      # 对于 release 触发的构建，将构建产物上传到现有 release
+      - name: Upload to existing Release
+        if: github.event_name == 'release'
+        uses: softprops/action-gh-release@v1
+        with:
+          tag_name: ${{ github.event.release.tag_name }}
+          files: |
+            release/latest*
+            release/umi*.dmg*
+            release/umi*.exe*
+            release/umi*.AppImage
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
@@ -0,0 +1,25 @@
+name: Database Schema Visualization CI
+
+on:
+  push:
+    branches:
+      - main
+    paths:
+      - 'docs/developer/database-schema.dbml'
+
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install dbdocs
+        run: sudo npm install -g dbdocs
+
+      - name: Check dbdocs
+        run: dbdocs
+
+      - name: sync database schema to dbdocs
+        env:
+          DBDOCS_TOKEN: ${{ secrets.DBDOCS_TOKEN }}
+        run: npm run db:visualize
@@ -68,4 +68,5 @@ public/swe-worker*
 *.patch
 *.pdf
 vertex-ai-key.json
-.pnpm-store
+.pnpm-store
+lobechat-db
@@ -1,6 +1,7 @@
 lockfile=false
 resolution-mode=highest

+ignore-workspace-root-check=true
 enable-pre-post-scripts=true

 public-hoist-pattern[]=*@umijs/lint*
@@ -44,9 +44,10 @@ ARG NEXT_PUBLIC_POSTHOG_KEY
 ARG NEXT_PUBLIC_ANALYTICS_UMAMI
 ARG NEXT_PUBLIC_UMAMI_SCRIPT_URL
 ARG NEXT_PUBLIC_UMAMI_WEBSITE_ID
+ARG FEATURE_FLAGS

-ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}"
-
+ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}" \
+    FEATURE_FLAGS="${FEATURE_FLAGS}"
 # Sentry
 ENV NEXT_PUBLIC_SENTRY_DSN="${NEXT_PUBLIC_SENTRY_DSN}" \
    SENTRY_ORG="" \
@@ -157,6 +158,8 @@ ENV \
    BAICHUAN_API_KEY="" BAICHUAN_MODEL_LIST="" \
    # Cloudflare
    CLOUDFLARE_API_KEY="" CLOUDFLARE_BASE_URL_OR_ACCOUNT_ID="" CLOUDFLARE_MODEL_LIST="" \
+    # Cohere
+    COHERE_API_KEY="" COHERE_MODEL_LIST="" COHERE_PROXY_URL="" \
    # DeepSeek
    DEEPSEEK_API_KEY="" DEEPSEEK_MODEL_LIST="" \
    # Fireworks AI
@@ -203,6 +206,8 @@ ENV \
    QWEN_API_KEY="" QWEN_MODEL_LIST="" QWEN_PROXY_URL="" \
    # SambaNova
    SAMBANOVA_API_KEY="" SAMBANOVA_MODEL_LIST="" \
+    # Search1API
+    SEARCH1API_API_KEY="" SEARCH1API_MODEL_LIST="" \
    # SenseNova
    SENSENOVA_API_KEY="" SENSENOVA_MODEL_LIST="" \
    # SiliconCloud
@@ -223,12 +228,16 @@ ENV \
    WENXIN_API_KEY="" WENXIN_MODEL_LIST="" \
    # xAI
    XAI_API_KEY="" XAI_MODEL_LIST="" XAI_PROXY_URL="" \
+    # Xinference
+    XINFERENCE_API_KEY="" XINFERENCE_MODEL_LIST="" XINFERENCE_PROXY_URL="" \
    # 01.AI
    ZEROONE_API_KEY="" ZEROONE_MODEL_LIST="" \
    # Zhipu
    ZHIPU_API_KEY="" ZHIPU_MODEL_LIST="" \
    # Tencent Cloud
-    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST=""
+    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST="" \
+    # Infini-AI
+    INFINIAI_API_KEY="" INFINIAI_MODEL_LIST=""

 USER nextjs

@@ -46,8 +46,10 @@ ARG NEXT_PUBLIC_POSTHOG_KEY
 ARG NEXT_PUBLIC_ANALYTICS_UMAMI
 ARG NEXT_PUBLIC_UMAMI_SCRIPT_URL
 ARG NEXT_PUBLIC_UMAMI_WEBSITE_ID
+ARG FEATURE_FLAGS

-ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}"
+ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}" \
+    FEATURE_FLAGS="${FEATURE_FLAGS}"

 ENV NEXT_PUBLIC_SERVICE_MODE="${NEXT_PUBLIC_SERVICE_MODE:-server}" \
    NEXT_PUBLIC_ENABLE_NEXT_AUTH="${NEXT_PUBLIC_ENABLE_NEXT_AUTH:-1}" \
@@ -200,6 +202,8 @@ ENV \
    BAICHUAN_API_KEY="" BAICHUAN_MODEL_LIST="" \
    # Cloudflare
    CLOUDFLARE_API_KEY="" CLOUDFLARE_BASE_URL_OR_ACCOUNT_ID="" CLOUDFLARE_MODEL_LIST="" \
+    # Cohere
+    COHERE_API_KEY="" COHERE_MODEL_LIST="" COHERE_PROXY_URL="" \
    # DeepSeek
    DEEPSEEK_API_KEY="" DEEPSEEK_MODEL_LIST="" \
    # Fireworks AI
@@ -246,6 +250,8 @@ ENV \
    QWEN_API_KEY="" QWEN_MODEL_LIST="" QWEN_PROXY_URL="" \
    # SambaNova
    SAMBANOVA_API_KEY="" SAMBANOVA_MODEL_LIST="" \
+    # Search1API
+    SEARCH1API_API_KEY="" SEARCH1API_MODEL_LIST="" \
    # SenseNova
    SENSENOVA_API_KEY="" SENSENOVA_MODEL_LIST="" \
    # SiliconCloud
@@ -266,12 +272,16 @@ ENV \
    WENXIN_API_KEY="" WENXIN_MODEL_LIST="" \
    # xAI
    XAI_API_KEY="" XAI_MODEL_LIST="" XAI_PROXY_URL="" \
+    # Xinference
+    XINFERENCE_API_KEY="" XINFERENCE_MODEL_LIST="" XINFERENCE_PROXY_URL="" \
    # 01.AI
    ZEROONE_API_KEY="" ZEROONE_MODEL_LIST="" \
    # Zhipu
    ZHIPU_API_KEY="" ZHIPU_MODEL_LIST="" \
    # Tencent Cloud
-    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST=""
+    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST="" \
+    # Infini-AI
+    INFINIAI_API_KEY="" INFINIAI_MODEL_LIST=""

 USER nextjs

@@ -44,9 +44,11 @@ ARG NEXT_PUBLIC_POSTHOG_KEY
 ARG NEXT_PUBLIC_ANALYTICS_UMAMI
 ARG NEXT_PUBLIC_UMAMI_SCRIPT_URL
 ARG NEXT_PUBLIC_UMAMI_WEBSITE_ID
+ARG FEATURE_FLAGS

 ENV NEXT_PUBLIC_CLIENT_DB="pglite"
-ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}"
+ENV NEXT_PUBLIC_BASE_PATH="${NEXT_PUBLIC_BASE_PATH}" \
+    FEATURE_FLAGS="${FEATURE_FLAGS}"

 # Sentry
 ENV NEXT_PUBLIC_SENTRY_DSN="${NEXT_PUBLIC_SENTRY_DSN}" \
@@ -158,6 +160,8 @@ ENV \
    BAICHUAN_API_KEY="" BAICHUAN_MODEL_LIST="" \
    # Cloudflare
    CLOUDFLARE_API_KEY="" CLOUDFLARE_BASE_URL_OR_ACCOUNT_ID="" CLOUDFLARE_MODEL_LIST="" \
+    # Cohere
+    COHERE_API_KEY="" COHERE_MODEL_LIST="" COHERE_PROXY_URL="" \
    # DeepSeek
    DEEPSEEK_API_KEY="" DEEPSEEK_MODEL_LIST="" \
    # Fireworks AI
@@ -222,12 +226,16 @@ ENV \
    WENXIN_API_KEY="" WENXIN_MODEL_LIST="" \
    # xAI
    XAI_API_KEY="" XAI_MODEL_LIST="" XAI_PROXY_URL="" \
+    # Xinference
+    XINFERENCE_API_KEY="" XINFERENCE_MODEL_LIST="" XINFERENCE_PROXY_URL="" \
    # 01.AI
    ZEROONE_API_KEY="" ZEROONE_MODEL_LIST="" \
    # Zhipu
    ZHIPU_API_KEY="" ZHIPU_MODEL_LIST="" \
    # Tencent Cloud
-    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST=""
+    TENCENT_CLOUD_API_KEY="" TENCENT_CLOUD_MODEL_LIST="" \
+    # Infini-AI
+    INFINIAI_API_KEY="" INFINIAI_MODEL_LIST=""

 USER nextjs

@@ -191,13 +191,14 @@ We have implemented support for the following model service providers:
 - **[Bedrock](https://lobechat.com/discover/provider/bedrock)**: Bedrock is a service provided by Amazon AWS, focusing on delivering advanced AI language and visual models for enterprises. Its model family includes Anthropic's Claude series, Meta's Llama 3.1 series, and more, offering a range of options from lightweight to high-performance, supporting tasks such as text generation, conversation, and image processing for businesses of varying scales and needs.
 - **[Google](https://lobechat.com/discover/provider/google)**: Google's Gemini series represents its most advanced, versatile AI models, developed by Google DeepMind, designed for multimodal capabilities, supporting seamless understanding and processing of text, code, images, audio, and video. Suitable for various environments from data centers to mobile devices, it significantly enhances the efficiency and applicability of AI models.
 - **[DeepSeek](https://lobechat.com/discover/provider/deepseek)**: DeepSeek is a company focused on AI technology research and application, with its latest model DeepSeek-V2.5 integrating general dialogue and code processing capabilities, achieving significant improvements in human preference alignment, writing tasks, and instruction following.
+- **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO supports stable and cost-efficient open-source LLM APIs, such as DeepSeek, Llama, Qwen etc.
 - **[HuggingFace](https://lobechat.com/discover/provider/huggingface)**: The HuggingFace Inference API provides a fast and free way for you to explore thousands of models for various tasks. Whether you are prototyping for a new application or experimenting with the capabilities of machine learning, this API gives you instant access to high-performance models across multiple domains.
 - **[OpenRouter](https://lobechat.com/discover/provider/openrouter)**: OpenRouter is a service platform providing access to various cutting-edge large model interfaces, supporting OpenAI, Anthropic, LLaMA, and more, suitable for diverse development and application needs. Users can flexibly choose the optimal model and pricing based on their requirements, enhancing the AI experience.
 - **[Cloudflare Workers AI](https://lobechat.com/discover/provider/cloudflare)**: Run serverless GPU-powered machine learning models on Cloudflare's global network.
+
+<details><summary><kbd>See more providers (+30)</kbd></summary>
+
 - **[GitHub](https://lobechat.com/discover/provider/github)**: With GitHub Models, developers can become AI engineers and leverage the industry's leading AI models.
-
-<details><summary><kbd>See more providers (+27)</kbd></summary>
-
 - **[Novita](https://lobechat.com/discover/provider/novita)**: Novita AI is a platform providing a variety of large language models and AI image generation API services, flexible, reliable, and cost-effective. It supports the latest open-source models like Llama3 and Mistral, offering a comprehensive, user-friendly, and auto-scaling API solution for generative AI application development, suitable for the rapid growth of AI startups.
 - **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO supports stable and cost-efficient open-source LLM APIs, such as DeepSeek, Llama, Qwen etc.
 - **[Together AI](https://lobechat.com/discover/provider/togetherai)**: Together AI is dedicated to achieving leading performance through innovative AI models, offering extensive customization capabilities, including rapid scaling support and intuitive deployment processes to meet various enterprise needs.
@@ -225,10 +226,12 @@ We have implemented support for the following model service providers:
 - **[Gitee AI](https://lobechat.com/discover/provider/giteeai)**: Gitee AI's Serverless API provides AI developers with an out of the box large model inference API service.
 - **[Taichu](https://lobechat.com/discover/provider/taichu)**: The Institute of Automation, Chinese Academy of Sciences, and Wuhan Artificial Intelligence Research Institute have launched a new generation of multimodal large models, supporting comprehensive question-answering tasks such as multi-turn Q\&A, text creation, image generation, 3D understanding, and signal analysis, with stronger cognitive, understanding, and creative abilities, providing a new interactive experience.
 - **[360 AI](https://lobechat.com/discover/provider/ai360)**: 360 AI is an AI model and service platform launched by 360 Company, offering various advanced natural language processing models, including 360GPT2 Pro, 360GPT Pro, 360GPT Turbo, and 360GPT Turbo Responsibility 8K. These models combine large-scale parameters and multimodal capabilities, widely applied in text generation, semantic understanding, dialogue systems, and code generation. With flexible pricing strategies, 360 AI meets diverse user needs, supports developer integration, and promotes the innovation and development of intelligent applications.
+- **[Search1API](https://lobechat.com/discover/provider/search1api)**: Search1API provides access to the DeepSeek series of models that can connect to the internet as needed, including standard and fast versions, supporting a variety of model sizes.
+- **[InfiniAI](https://lobechat.com/discover/provider/infiniai)**: Provides high-performance, easy-to-use, and secure large model services for application developers, covering the entire process from large model development to service deployment.

 </details>

-> 📊 Total providers: [<kbd>**37**</kbd>](https://lobechat.com/discover/providers)
+> 📊 Total providers: [<kbd>**40**</kbd>](https://lobechat.com/discover/providers)

 <!-- PROVIDER LIST -->

@@ -325,12 +328,12 @@ In addition, these plugins are not limited to news aggregation, but can also ext

 | Recent Submits                                                                                                               | Description                                                                                                             |
 | ---------------------------------------------------------------------------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------- |
+| [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2025-03-23**</sup>        | Analyze stocks and get comprehensive real-time investment data and analytics.<br/>`stock`                               |
 | [Web](https://lobechat.com/discover/plugin/web)<br/><sup>By **Proghit** on **2025-01-24**</sup>                              | Smart web search that reads and analyzes pages to deliver comprehensive answers from Google results.<br/>`web` `search` |
 | [MintbaseSearch](https://lobechat.com/discover/plugin/mintbasesearch)<br/><sup>By **mintbase** on **2024-12-31**</sup>       | Find any NFT data on the NEAR Protocol.<br/>`crypto` `nft`                                                              |
 | [Bing_websearch](https://lobechat.com/discover/plugin/Bingsearch-identifier)<br/><sup>By **FineHow** on **2024-12-22**</sup> | Search for information from the internet base BingApi<br/>`bingsearch`                                                  |
-| [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2024-12-22**</sup>        | Analyze stocks and get comprehensive real-time investment data and analytics.<br/>`stock`                               |

-> 📊 Total plugins: [<kbd>**47**</kbd>](https://lobechat.com/discover/plugins)
+> 📊 Total plugins: [<kbd>**46**</kbd>](https://lobechat.com/discover/plugins)

 <!-- PLUGIN LIST -->

@@ -364,12 +367,12 @@ Our marketplace is not just a showcase platform but also a collaborative space.

 | Recent Submits                                                                                                                                                                                        | Description                                                                                                                                                      |
 | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| [学术论文综述专家](https://lobechat.com/discover/assistant/academic-paper-overview)<br/><sup>By **[arvinxx](https://github.com/arvinxx)** on **2025-03-11**</sup>                                     | 擅长高质量文献检索与分析的学术研究助手<br/>`学术研究` `文献检索` `数据分析` `信息提取` `咨询`                                                                    |
 | [Cron Expression Assistant](https://lobechat.com/discover/assistant/crontab-generate)<br/><sup>By **[edgesider](https://github.com/edgesider)** on **2025-02-17**</sup>                               | Crontab Expression Generator<br/>`crontab` `time-expression` `trigger-time` `generator` `technical-assistance`                                                   |
 | [Xiao Zhi French Translation Assistant](https://lobechat.com/discover/assistant/xiao-zhi-french-translation-asst-v-1)<br/><sup>By **[WeR-Best](https://github.com/WeR-Best)** on **2025-02-10**</sup> | A friendly, professional, and empathetic AI assistant for French translation<br/>`ai-assistant` `french-translation` `cross-cultural-communication` `creativity` |
-| [Language Charm Learning Mentor](https://lobechat.com/discover/assistant/bad-language-helper)<br/><sup>By **[Guducat](https://github.com/Guducat)** on **2025-02-06**</sup>                           | Specializes in teaching the charm of language and witty responses<br/>`language-learning` `dialogue-examples`                                                    |
-| [Astrology Researcher](https://lobechat.com/discover/assistant/fate-researcher)<br/><sup>By **[Jack980506](https://github.com/Jack980506)** on **2025-02-06**</sup>                                   | Expert in BaZi astrology<br/>`astrology` `ba-zi` `traditional-culture`                                                                                           |
+| [Investment Assistant](https://lobechat.com/discover/assistant/graham-investmentassi)<br/><sup>By **[farsightlin](https://github.com/farsightlin)** on **2025-02-06**</sup>                           | Helps users calculate the data needed for valuation<br/>`investment` `valuation` `financial-analysis` `calculator`                                               |

-> 📊 Total agents: [<kbd>**487**</kbd> ](https://lobechat.com/discover/assistants)
+> 📊 Total agents: [<kbd>**488**</kbd> ](https://lobechat.com/discover/assistants)

 <!-- AGENT LIST -->

@@ -759,7 +762,7 @@ Every bit counts and your one-time donation sparkles in our galaxy of support! Y

 </details>

-Copyright © 2024 [LobeHub][profile-link]. <br />
+Copyright © 2025 [LobeHub][profile-link]. <br />
 This project is [Apache 2.0](./LICENSE) licensed.

 <!-- LINK GROUP -->
@@ -191,13 +191,14 @@ LobeChat 支持文件上传与知识库功能，你可以上传文件、图片
 - **[Bedrock](https://lobechat.com/discover/provider/bedrock)**: Bedrock 是亚马逊 AWS 提供的一项服务，专注于为企业提供先进的 AI 语言模型和视觉模型。其模型家族包括 Anthropic 的 Claude 系列、Meta 的 Llama 3.1 系列等，涵盖从轻量级到高性能的多种选择，支持文本生成、对话、图像处理等多种任务，适用于不同规模和需求的企业应用。
 - **[Google](https://lobechat.com/discover/provider/google)**: Google 的 Gemini 系列是其最先进、通用的 AI 模型，由 Google DeepMind 打造，专为多模态设计，支持文本、代码、图像、音频和视频的无缝理解与处理。适用于从数据中心到移动设备的多种环境，极大提升了 AI 模型的效率与应用广泛性。
 - **[DeepSeek](https://lobechat.com/discover/provider/deepseek)**: DeepSeek 是一家专注于人工智能技术研究和应用的公司，其最新模型 DeepSeek-V3 多项评测成绩超越 Qwen2.5-72B 和 Llama-3.1-405B 等开源模型，性能对齐领军闭源模型 GPT-4o 与 Claude-3.5-Sonnet。
+- **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO 派欧云提供稳定、高性价比的开源模型 API 服务，支持 DeepSeek 全系列、Llama、Qwen 等行业领先大模型。
 - **[HuggingFace](https://lobechat.com/discover/provider/huggingface)**: HuggingFace Inference API 提供了一种快速且免费的方式，让您可以探索成千上万种模型，适用于各种任务。无论您是在为新应用程序进行原型设计，还是在尝试机器学习的功能，这个 API 都能让您即时访问多个领域的高性能模型。
 - **[OpenRouter](https://lobechat.com/discover/provider/openrouter)**: OpenRouter 是一个提供多种前沿大模型接口的服务平台，支持 OpenAI、Anthropic、LLaMA 及更多，适合多样化的开发和应用需求。用户可根据自身需求灵活选择最优的模型和价格，助力 AI 体验的提升。
 - **[Cloudflare Workers AI](https://lobechat.com/discover/provider/cloudflare)**: 在 Cloudflare 的全球网络上运行由无服务器 GPU 驱动的机器学习模型。
+
+<details><summary><kbd>See more providers (+30)</kbd></summary>
+
 - **[GitHub](https://lobechat.com/discover/provider/github)**: 通过 GitHub 模型，开发人员可以成为 AI 工程师，并使用行业领先的 AI 模型进行构建。
-
-<details><summary><kbd>See more providers (+27)</kbd></summary>
-
 - **[Novita](https://lobechat.com/discover/provider/novita)**: Novita AI 是一个提供多种大语言模型与 AI 图像生成的 API 服务的平台，灵活、可靠且具有成本效益。它支持 Llama3、Mistral 等最新的开源模型，并为生成式 AI 应用开发提供了全面、用户友好且自动扩展的 API 解决方案，适合 AI 初创公司的快速发展。
 - **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO 派欧云提供稳定、高性价比的开源模型 API 服务，支持 DeepSeek 全系列、Llama、Qwen 等行业领先大模型。
 - **[Together AI](https://lobechat.com/discover/provider/togetherai)**: Together AI 致力于通过创新的 AI 模型实现领先的性能，提供广泛的自定义能力，包括快速扩展支持和直观的部署流程，满足企业的各种需求。
@@ -225,10 +226,12 @@ LobeChat 支持文件上传与知识库功能，你可以上传文件、图片
 - **[Gitee AI](https://lobechat.com/discover/provider/giteeai)**: Gitee AI 的 Serverless API 为 AI 开发者提供开箱即用的大模型推理 API 服务。
 - **[Taichu](https://lobechat.com/discover/provider/taichu)**: 中科院自动化研究所和武汉人工智能研究院推出新一代多模态大模型，支持多轮问答、文本创作、图像生成、3D 理解、信号分析等全面问答任务，拥有更强的认知、理解、创作能力，带来全新互动体验。
 - **[360 AI](https://lobechat.com/discover/provider/ai360)**: 360 AI 是 360 公司推出的 AI 模型和服务平台，提供多种先进的自然语言处理模型，包括 360GPT2 Pro、360GPT Pro、360GPT Turbo 和 360GPT Turbo Responsibility 8K。这些模型结合了大规模参数和多模态能力，广泛应用于文本生成、语义理解、对话系统与代码生成等领域。通过灵活的定价策略，360 AI 满足多样化用户需求，支持开发者集成，推动智能化应用的革新和发展。
+- **[Search1API](https://lobechat.com/discover/provider/search1api)**: Search1API 提供可根据需要自行联网的 DeepSeek 系列模型的访问，包括标准版和快速版本，支持多种参数规模的模型选择。
+- **[InfiniAI](https://lobechat.com/discover/provider/infiniai)**: 为应用开发者提供高性能、易上手、安全可靠的大模型服务，覆盖从大模型开发到大模型服务化部署的全流程。

 </details>

-> 📊 Total providers: [<kbd>**37**</kbd>](https://lobechat.com/discover/providers)
+> 📊 Total providers: [<kbd>**40**</kbd>](https://lobechat.com/discover/providers)

 <!-- PROVIDER LIST -->

@@ -318,12 +321,12 @@ LobeChat 的插件生态系统是其核心功能的重要扩展，它极大地

 | 最近新增                                                                                                                   | 描述                                                                               |
 | -------------------------------------------------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------- |
+| [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2025-03-23**</sup>      | 分析股票并获取全面的实时投资数据和分析。<br/>`股票`                                |
 | [网页](https://lobechat.com/discover/plugin/web)<br/><sup>By **Proghit** on **2025-01-24**</sup>                           | 智能网页搜索，读取和分析页面，以提供来自 Google 结果的全面答案。<br/>`网页` `搜索` |
 | [MintbaseSearch](https://lobechat.com/discover/plugin/mintbasesearch)<br/><sup>By **mintbase** on **2024-12-31**</sup>     | 在 NEAR 协议上查找任何 NFT 数据。<br/>`加密货币` `nft`                             |
 | [必应网页搜索](https://lobechat.com/discover/plugin/Bingsearch-identifier)<br/><sup>By **FineHow** on **2024-12-22**</sup> | 通过 BingApi 搜索互联网上的信息<br/>`bingsearch`                                   |
-| [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2024-12-22**</sup>      | 分析股票并获取全面的实时投资数据和分析。<br/>`股票`                                |

-> 📊 Total plugins: [<kbd>**47**</kbd>](https://lobechat.com/discover/plugins)
+> 📊 Total plugins: [<kbd>**46**</kbd>](https://lobechat.com/discover/plugins)

 <!-- PLUGIN LIST -->

@@ -351,14 +354,14 @@ LobeChat 的插件生态系统是其核心功能的重要扩展，它极大地

 <!-- AGENT LIST -->

-| 最近新增                                                                                                                                                                         | 描述                                                                                   |
-| -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -------------------------------------------------------------------------------------- |
-| [Cron 表达式助手](https://lobechat.com/discover/assistant/crontab-generate)<br/><sup>By **[edgesider](https://github.com/edgesider)** on **2025-02-17**</sup>                    | Crontab 表达式生成<br/>`crontab` `时间表达` `触发时间` `生成器` `技术辅助`             |
-| [小智法语翻译助手](https://lobechat.com/discover/assistant/xiao-zhi-french-translation-asst-v-1)<br/><sup>By **[WeR-Best](https://github.com/WeR-Best)** on **2025-02-10**</sup> | 友好、专业、富有同理心的法语翻译 AI 助手<br/>`ai助手` `法语翻译` `跨文化交流` `创造力` |
-| [语言魅力学习导师](https://lobechat.com/discover/assistant/bad-language-helper)<br/><sup>By **[Guducat](https://github.com/Guducat)** on **2025-02-06**</sup>                    | 擅长教学语言的魅力与花样回复<br/>`语言学习` `对话示例`                                 |
-| [命理研究员](https://lobechat.com/discover/assistant/fate-researcher)<br/><sup>By **[Jack980506](https://github.com/Jack980506)** on **2025-02-06**</sup>                        | 精通八字命<br/>`命理学` `八字` `传统文化`                                              |
+| 最近新增                                                                                                                                                                         | 描述                                                                                          |
+| -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | --------------------------------------------------------------------------------------------- |
+| [学术论文综述专家](https://lobechat.com/discover/assistant/academic-paper-overview)<br/><sup>By **[arvinxx](https://github.com/arvinxx)** on **2025-03-11**</sup>                | 擅长高质量文献检索与分析的学术研究助手<br/>`学术研究` `文献检索` `数据分析` `信息提取` `咨询` |
+| [Cron 表达式助手](https://lobechat.com/discover/assistant/crontab-generate)<br/><sup>By **[edgesider](https://github.com/edgesider)** on **2025-02-17**</sup>                    | Crontab 表达式生成<br/>`crontab` `时间表达` `触发时间` `生成器` `技术辅助`                    |
+| [小智法语翻译助手](https://lobechat.com/discover/assistant/xiao-zhi-french-translation-asst-v-1)<br/><sup>By **[WeR-Best](https://github.com/WeR-Best)** on **2025-02-10**</sup> | 友好、专业、富有同理心的法语翻译 AI 助手<br/>`ai助手` `法语翻译` `跨文化交流` `创造力`        |
+| [投资小助手](https://lobechat.com/discover/assistant/graham-investmentassi)<br/><sup>By **[farsightlin](https://github.com/farsightlin)** on **2025-02-06**</sup>                | 帮助用户计算估值所需的一些数据<br/>`投资` `估值` `财务分析` `计算器`                          |

-> 📊 Total agents: [<kbd>**487**</kbd> ](https://lobechat.com/discover/assistants)
+> 📊 Total agents: [<kbd>**488**</kbd> ](https://lobechat.com/discover/assistants)

 <!-- AGENT LIST -->

@@ -781,7 +784,7 @@ $ pnpm run dev

 </details>

-Copyright © 2023 [LobeHub][profile-link]. <br />
+Copyright © 2025 [LobeHub][profile-link]. <br />
 This project is [Apache 2.0](./LICENSE) licensed.

 <!-- LINK GROUP -->
@@ -0,0 +1,8 @@
+node_modules
+dist
+out
+.DS_Store
+.eslintcache
+*.log*
+standalone
+release
@@ -0,0 +1,4 @@
+lockfile=false
+shamefully-hoist=true
+electron_mirror=https://npmmirror.com/mirrors/electron/
+electron_builder_binaries_mirror=https://npmmirror.com/mirrors/electron-builder-binaries/
@@ -0,0 +1,4 @@
+构建路径：
+
+- dist: 构建产物路径
+- release: 发布产物路径
@@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+<plist version="1.0">
+  <dict>
+    <key>com.apple.security.cs.allow-jit</key>
+    <true/>
+    <key>com.apple.security.cs.allow-unsigned-executable-memory</key>
+    <true/>
+    <key>com.apple.security.cs.allow-dyld-environment-variables</key>
+    <true/>
+  </dict>
+</plist>
@@ -0,0 +1,3 @@
+provider: generic
+url: https://example.com/auto-updates
+updaterCacheDirName: electron-app-updater
@@ -0,0 +1,71 @@
+/**
+ * @type {import('electron-builder').Configuration}
+ * @see https://www.electron.build/configuration
+ */
+const config = {
+  appId: 'com.lobehub.lobehub-desktop',
+  appImage: {
+    artifactName: '${productName}-${version}.${ext}',
+  },
+  asar: false,
+  // TODO: 研究下怎么样可以做成 asar 的模式
+  // asar: { smartUnpack: false },
+  // asarUnpack: ['dist/next'],
+  directories: {
+    buildResources: 'build',
+    output: 'release',
+  },
+  dmg: {
+    artifactName: '${productName}-${version}.${ext}',
+  },
+  electronDownload: {
+    mirror: 'https://npmmirror.com/mirrors/electron/',
+  },
+  files: [
+    'dist',
+    'resources',
+    '!dist/next/docs',
+    '!dist/next/packages',
+    '!dist/next/.next/server/app/sitemap',
+    // '!dist/next/.next/static/media',
+  ],
+  linux: {
+    category: 'Utility',
+    maintainer: 'electronjs.org',
+    target: ['AppImage', 'snap', 'deb'],
+  },
+  mac: {
+    compression: 'maximum',
+    entitlementsInherit: 'build/entitlements.mac.plist',
+    extendInfo: [
+      { NSCameraUsageDescription: "Application requests access to the device's camera." },
+      { NSMicrophoneUsageDescription: "Application requests access to the device's microphone." },
+      {
+        NSDocumentsFolderUsageDescription:
+          "Application requests access to the user's Documents folder.",
+      },
+      {
+        NSDownloadsFolderUsageDescription:
+          "Application requests access to the user's Downloads folder.",
+      },
+    ],
+    notarize: false,
+  },
+  npmRebuild: true,
+  nsis: {
+    artifactName: '${productName}-${version}-setup.${ext}',
+    createDesktopShortcut: 'always',
+    shortcutName: '${productName}',
+    uninstallDisplayName: '${productName}',
+  },
+  productName: 'LobeHub',
+  publish: {
+    provider: 'generic',
+    url: 'https://example.com/auto-updates',
+  },
+  win: {
+    executableName: 'electron-app',
+  },
+};
+
+export default config;
@@ -0,0 +1,22 @@
+import { defineConfig, externalizeDepsPlugin } from 'electron-vite';
+import { resolve } from 'node:path';
+
+export default defineConfig({
+  main: {
+    build: {
+      outDir: 'dist/main',
+    },
+    plugins: [externalizeDepsPlugin({})],
+    resolve: {
+      alias: {
+        '@': resolve(__dirname, 'src/main'),
+      },
+    },
+  },
+  preload: {
+    build: {
+      outDir: 'dist/preload',
+    },
+    plugins: [externalizeDepsPlugin({})],
+  },
+});
@@ -0,0 +1,51 @@
+{
+  "name": "lobehub-desktop",
+  "version": "0.0.2-nightly",
+  "description": "A minimal Electron application with TypeScript",
+  "homepage": "https://lobehub.com",
+  "author": "arvinxx",
+  "main": "./dist/main/index.js",
+  "scripts": {
+    "build": "npm run typecheck && electron-vite build",
+    "build:linux": "npm run build && electron-builder --linux --config electron-builder.js",
+    "build:mac": "npm run build && electron-builder --mac --config electron-builder.js",
+    "build:unpack": "npm run build && electron-builder --dir --config electron-builder.js",
+    "build:win": "npm run build && electron-builder --win --config electron-builder.js",
+    "electron:dev": "electron-vite dev",
+    "electron:run-unpack": "electron .",
+    "format": "prettier --write ",
+    "postinstall": "electron-builder install-app-deps",
+    "install-isolated": "pnpm install",
+    "lint": "eslint --cache ",
+    "pg-server": "bun run scripts/pglite-server.ts",
+    "start": "electron-vite preview",
+    "typecheck": "tsc --noEmit -p tsconfig.json"
+  },
+  "dependencies": {
+    "@electron-toolkit/utils": "^4.0.0",
+    "electron-updater": "^6.3.9",
+    "function-bind": "^1.1.2",
+    "get-port-please": "^3.1.2",
+    "next-electron-rsc": "^0.2.3"
+  },
+  "devDependencies": {
+    "@electron-toolkit/eslint-config-prettier": "^3.0.0",
+    "@electron-toolkit/eslint-config-ts": "^3.0.0",
+    "@electron-toolkit/preload": "^3.0.1",
+    "@electron-toolkit/tsconfig": "^1.0.1",
+    "@lobechat/electron-client-ipc": "workspace:*",
+    "@lobechat/electron-server-ipc": "workspace:*",
+    "electron": "35.1.1",
+    "electron-builder": "^26.0.12",
+    "electron-is": "^3.0.0",
+    "electron-vite": "^3.0.0",
+    "pglite-server": "^0.1.4",
+    "typescript": "^5.7.3",
+    "vite": "^6.2.4"
+  },
+  "pnpm": {
+    "onlyBuiltDependencies": [
+      "electron"
+    ]
+  }
+}
@@ -0,0 +1,4 @@
+packages:
+  - '../../packages/electron-server-ipc'
+  - '../../packages/electron-client-ipc'
+  - '.'
@@ -0,0 +1,124 @@
+<!doctype html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+    <title>LobeHub - 连接错误</title>
+    <style>
+      body {
+        -webkit-app-region: drag;
+        margin: 0;
+        padding: 0;
+        height: 100vh;
+        display: flex;
+        justify-content: center;
+        align-items: center;
+        font-family:
+          -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Helvetica, Arial, sans-serif;
+        color: #1f1f1f;
+        overflow: hidden;
+      }
+
+      /* 添加暗色模式支持 */
+      @media (prefers-color-scheme: dark) {
+        body {
+          color: #f5f5f5;
+          background-color: #121212;
+        }
+        .error-message {
+          color: #f5f5f5;
+        }
+        .retry-button {
+          background-color: #2a2a2a;
+          color: #f5f5f5;
+          border: 1px solid #3a3a3a;
+        }
+        .retry-button:hover {
+          background-color: #3a3a3a;
+        }
+      }
+
+      .container {
+        text-align: center;
+        padding: 2rem;
+        max-width: 500px;
+      }
+
+      .lobe-brand {
+        width: 120px;
+        height: auto;
+        margin-bottom: 2rem;
+      }
+
+      .lobe-brand path {
+        fill: currentcolor;
+      }
+
+      .error-icon {
+        font-size: 3rem;
+        margin-bottom: 1rem;
+        color: #ff4d4f;
+      }
+
+      .error-title {
+        font-size: 1.5rem;
+        font-weight: 600;
+        margin-bottom: 1rem;
+      }
+
+      .error-message {
+        margin-bottom: 2rem;
+        line-height: 1.5;
+        color: #666;
+      }
+
+      .retry-button {
+        -webkit-app-region: no-drag;
+        padding: 0.75rem 1.5rem;
+        background-color: #f5f5f5;
+        color: #1f1f1f;
+        border: 1px solid #e0e0e0;
+        border-radius: 6px;
+        font-size: 1rem;
+        cursor: pointer;
+        transition: all 0.2s ease;
+      }
+
+      .retry-button:hover {
+        background-color: #e9e9e9;
+      }
+    </style>
+  </head>
+  <body>
+    <div class="container">
+      <div class="error-icon">⚠️</div>
+      <h1 class="error-title">Connection Error</h1>
+      <p class="error-message">
+        Unable to connect to the application, please check your network connection or confirm if the
+        development server is running.
+      </p>
+
+      <button id="retry-button" class="retry-button">Retry</button>
+    </div>
+
+    <script>
+      // 当按钮被点击时，通知主进程重试连接
+      const retryButton = document.getElementById('retry-button');
+      const errorMessage = document.querySelector('.error-message');
+
+      if (retryButton) {
+        retryButton.addEventListener('click', () => {
+          // 更新UI状态
+          retryButton.disabled = true;
+          retryButton.textContent = 'Retrying...';
+          errorMessage.textContent = 'Attempting to reconnect to the server, please wait...';
+
+          // 调用主进程的重试逻辑
+          if (window.electron && window.electron.ipcRenderer) {
+            window.electron.ipcRenderer.send('retry-connection');
+          }
+        });
+      }
+    </script>
+  </body>
+</html>
@@ -0,0 +1,88 @@
+<!doctype html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+    <title>LobeHub</title>
+    <style>
+      body {
+        -webkit-app-region: drag;
+        margin: 0;
+        padding: 0;
+        height: 100vh;
+        display: flex;
+        justify-content: center;
+        align-items: center;
+        font-family:
+          -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Helvetica, Arial, sans-serif;
+        color: #1f1f1f;
+        overflow: hidden;
+      }
+
+      /* 添加暗色模式支持 */
+      @media (prefers-color-scheme: dark) {
+        body {
+          color: #f5f5f5;
+        }
+      }
+
+      .container {
+        text-align: center;
+      }
+
+      .lobe-brand-loading {
+        width: 120px;
+        height: auto;
+      }
+
+      .lobe-brand-loading path {
+        fill: currentcolor;
+        fill-opacity: 0%;
+        stroke: currentcolor;
+        stroke-dasharray: 1000;
+        stroke-dashoffset: 1000;
+        stroke-width: 0.25em;
+
+        animation:
+          draw 2s cubic-bezier(0.4, 0, 0.2, 1) infinite,
+          fill 2s cubic-bezier(0.4, 0, 0.2, 1) infinite;
+      }
+
+      @keyframes draw {
+        0% {
+          stroke-dashoffset: 1000;
+        }
+
+        100% {
+          stroke-dashoffset: 0;
+        }
+      }
+
+      @keyframes fill {
+        30% {
+          fill-opacity: 5%;
+        }
+
+        100% {
+          fill-opacity: 100%;
+        }
+      }
+    </style>
+  </head>
+  <body>
+    <div class="container">
+      <svg
+        class="lobe-brand-loading"
+        fill="currentColor"
+        fillRule="evenodd"
+        viewBox="0 0 940 320"
+        xmlns="http://www.w3.org/2000/svg"
+      >
+        <title>LobeHub</title>
+        <path
+          d="M15 240.035V87.172h39.24V205.75h66.192v34.285H15zM183.731 242c-11.759 0-22.196-2.621-31.313-7.862-9.116-5.241-16.317-12.447-21.601-21.619-5.153-9.317-7.729-19.945-7.729-31.883 0-11.937 2.576-22.492 7.729-31.664 5.164-8.963 12.159-15.98 20.982-21.05l.619-.351c9.117-5.241 19.554-7.861 31.313-7.861s22.196 2.62 31.313 7.861c9.248 5.096 16.449 12.229 21.601 21.401 5.153 9.172 7.729 19.727 7.729 31.664 0 11.938-2.576 22.566-7.729 31.883-5.152 9.172-12.353 16.378-21.601 21.619-9.117 5.241-19.554 7.862-31.313 7.862zm0-32.975c4.36 0 8.191-1.092 11.494-3.275 3.436-2.184 6.144-5.387 8.126-9.609 1.982-4.367 2.973-9.536 2.973-15.505 0-5.968-.991-10.991-2.973-15.067-1.906-4.06-4.483-7.177-7.733-9.352l-.393-.257c-3.303-2.184-7.134-3.276-11.494-3.276-4.228 0-8.059 1.092-11.495 3.276-3.303 2.184-6.011 5.387-8.125 9.609-1.982 4.076-2.973 9.099-2.973 15.067 0 5.969.991 11.138 2.973 15.505 2.114 4.222 4.822 7.425 8.125 9.609 3.436 2.183 7.267 3.275 11.495 3.275zM295.508 78l-.001 54.042a34.071 34.071 0 016.541-5.781c6.474-4.367 14.269-6.551 23.385-6.551 9.777 0 18.629 2.475 26.557 7.424 7.872 4.835 14.105 11.684 18.7 20.546l.325.637c4.756 9.026 7.135 19.799 7.135 32.319 0 12.666-2.379 23.585-7.135 32.757-4.624 9.026-10.966 16.087-19.025 21.182-7.928 4.95-16.78 7.425-26.557 7.425-9.644 0-17.704-2.184-24.178-6.551-2.825-1.946-5.336-4.355-7.532-7.226l.001 11.812h-35.87V78h37.654zm21.998 74.684c-4.228 0-8.059 1.092-11.494 3.276-3.303 2.184-6.012 5.387-8.126 9.609-1.982 4.076-2.972 9.099-2.972 15.067 0 5.969.99 11.138 2.972 15.505 2.114 4.222 4.823 7.425 8.126 9.609 3.435 2.183 7.266 3.275 11.494 3.275s7.994-1.092 11.297-3.275c3.435-2.184 6.143-5.387 8.125-9.609 2.114-4.367 3.171-9.536 3.171-15.505 0-5.968-1.057-10.991-3.171-15.067-1.906-4.06-4.483-7.177-7.732-9.352l-.393-.257c-3.303-2.184-7.069-3.276-11.297-3.276zm105.335 38.653l.084.337a27.857 27.857 0 002.057 5.559c2.246 4.222 5.417 7.498 9.513 9.827 4.096 2.184 8.984 3.276 14.665 3.276 5.285 0 9.777-.801 13.477-2.403 3.579-1.632 7.1-4.025 10.564-7.182l.732-.679 19.818 22.711c-5.153 6.26-11.494 11.064-19.025 14.413-7.531 3.203-16.449 4.804-26.755 4.804-12.683 0-23.782-2.621-33.294-7.862-9.381-5.386-16.713-12.665-21.998-21.837-5.153-9.317-7.729-19.872-7.729-31.665 0-11.792 2.51-22.274 7.53-31.446 5.036-9.105 11.902-16.195 20.596-21.268l.61-.351c8.984-5.241 19.091-7.861 30.322-7.861 10.311 0 19.743 2.286 28.294 6.859l.64.347c8.72 4.659 15.656 11.574 20.809 20.746 5.153 9.172 7.729 20.309 7.729 33.411 0 1.294-.052 2.761-.156 4.4l-.042.623-.17 2.353c-.075 1.01-.151 1.973-.227 2.888h-78.044zm21.365-42.147c-4.492 0-8.456 1.092-11.891 3.276-3.303 2.184-5.879 5.314-7.729 9.39a26.04 26.04 0 00-1.117 2.79 30.164 30.164 0 00-1.121 4.499l-.058.354h43.96l-.015-.106c-.401-2.638-1.122-5.055-2.163-7.252l-.246-.503c-1.776-3.774-4.282-6.742-7.519-8.906l-.409-.266c-3.303-2.184-7.2-3.276-11.692-3.276zm111.695-62.018l-.001 57.432h53.51V87.172h39.24v152.863h-39.24v-59.617H555.9l.001 59.617h-39.24V87.172h39.24zM715.766 242c-8.72 0-16.581-1.893-23.583-5.678-6.87-3.785-12.287-9.681-16.251-17.688-3.832-8.153-5.747-18.417-5.747-30.791v-66.168h37.654v59.398c0 9.172 1.519 15.723 4.558 19.654 3.171 3.931 7.597 5.896 13.278 5.896 3.7 0 7.069-.946 10.108-2.839 3.038-1.892 5.483-4.877 7.332-8.953 1.85-4.222 2.775-9.609 2.775-16.16v-56.996h37.654v118.36h-35.871l.004-12.38c-2.642 3.197-5.682 5.868-9.12 8.012-7.002 4.222-14.599 6.333-22.791 6.333zM841.489 78l-.001 54.041a34.1 34.1 0 016.541-5.78c6.474-4.367 14.269-6.551 23.385-6.551 9.777 0 18.629 2.475 26.556 7.424 7.873 4.835 14.106 11.684 18.701 20.546l.325.637c4.756 9.026 7.134 19.799 7.134 32.319 0 12.666-2.378 23.585-7.134 32.757-4.624 9.026-10.966 16.087-19.026 21.182-7.927 4.95-16.779 7.425-26.556 7.425-9.645 0-17.704-2.184-24.178-6.551-2.825-1.946-5.336-4.354-7.531-7.224v11.81h-35.87V78h37.654zm21.998 74.684c-4.228 0-8.059 1.092-11.495 3.276-3.303 2.184-6.011 5.387-8.125 9.609-1.982 4.076-2.973 9.099-2.973 15.067 0 5.969.991 11.138 2.973 15.505 2.114 4.222 4.822 7.425 8.125 9.609 3.436 2.183 7.267 3.275 11.495 3.275 4.228 0 7.993-1.092 11.296-3.275 3.435-2.184 6.144-5.387 8.126-9.609 2.114-4.367 3.171-9.536 3.171-15.505 0-5.968-1.057-10.991-3.171-15.067-1.906-4.06-4.484-7.177-7.733-9.352l-.393-.257c-3.303-2.184-7.068-3.276-11.296-3.276z"
+        />
+      </svg>
+    </div>
+  </body>
+</html>
@@ -0,0 +1,14 @@
+import { PGlite } from "@electric-sql/pglite";
+import { createServer } from "pglite-server";
+
+// 创建或连接到您现有的 PGlite 数据库
+const db = new PGlite("/Users/arvinxx/Library/Application Support/lobehub-desktop/lobehub-local-db");
+await db.waitReady;
+
+// 创建服务器并监听端口
+const PORT = 6543;
+const pgServer = createServer(db);
+
+pgServer.listen(PORT, () => {
+  console.log(`PGlite 服务器已启动，监听端口 ${PORT}`);
+});
@@ -0,0 +1,26 @@
+import type { BrowserWindowOpts } from './core/Browser';
+
+export const chat: BrowserWindowOpts = {
+  autoHideMenuBar: true,
+  height: 800,
+  identifier: 'chat',
+  keepAlive: true,
+  minWidth: 400,
+  path: '/chat',
+  titleBarStyle: 'hidden',
+  vibrancy: 'under-window',
+  width: 1200,
+};
+
+export const devtools: BrowserWindowOpts = {
+  autoHideMenuBar: true,
+  fullscreenable: false,
+  height: 600,
+  identifier: 'devtools',
+  maximizable: false,
+  minWidth: 400,
+  path: '/desktop/devtools',
+  titleBarStyle: 'hiddenInset',
+  vibrancy: 'under-window',
+  width: 1000,
+};
@@ -0,0 +1,14 @@
+import { app } from 'electron';
+import { join } from 'node:path';
+
+export const mainDir = join(__dirname);
+
+export const preloadDir = join(mainDir, '../preload');
+
+export const resourcesDir = join(mainDir, '../../resources');
+
+export const buildDir = join(mainDir, '../../build');
+
+const appPath = app.getAppPath();
+
+export const nextStandaloneDir = join(appPath, 'dist', 'next');
@@ -0,0 +1 @@
+export const isDev = process.env.NODE_ENV === 'development';
@@ -0,0 +1,9 @@
+import { devtools } from '../appBrowsers';
+import { ControllerModule } from './index';
+
+export default class DevtoolsCtr extends ControllerModule {
+  // @event('openDevtools')
+  async openDevtools() {
+    this.app.browserManager.retrieveOrInitialize(devtools);
+  }
+}
@@ -0,0 +1,30 @@
+import type { ClientDispatchEvents } from '@lobechat/electron-client-ipc';
+
+import type { App } from '../core/App';
+import { IoCContainer } from '../core/IoCContainer';
+
+const baseDecorator =
+  (name: string, showLog = true) =>
+  (target: any, methodName: string, descriptor?: any) => {
+    const actions = IoCContainer.controllers.get(target.constructor) || [];
+    actions.push({
+      methodName,
+      name,
+      showLog,
+    });
+    IoCContainer.controllers.set(target.constructor, actions);
+    return descriptor;
+  };
+
+/**
+ *  service 用的 event 装饰器
+ */
+export const ipcClientEvent = (method: keyof ClientDispatchEvents) => baseDecorator(method);
+
+export class ControllerModule {
+  constructor(public app: App) {
+    this.app = app;
+  }
+}
+
+export type IControlModule = typeof ControllerModule;
@@ -0,0 +1,138 @@
+import { Session, app, ipcMain, protocol } from 'electron';
+import { macOS, windows } from 'electron-is';
+import { createHandler } from 'next-electron-rsc';
+import { join } from 'node:path';
+
+import * as appBrowsers from '../appBrowsers';
+import { buildDir, nextStandaloneDir } from '../const/dir';
+import { isDev } from '../const/env';
+import { IControlModule } from '../controllers';
+import BrowserManager from './BrowserManager';
+import { initIPCServer } from './IPCServer';
+import { IoCContainer } from './IoCContainer';
+
+export type IPCClientEventMap = Map<string, any>;
+
+const importAll = (r: any) => Object.values(r).map((v: any) => v.default);
+
+export class App {
+  /**
+   * all controllers in app
+   */
+  private controllers = new WeakMap();
+  nextServerUrl = 'http://localhost:3010';
+
+  /**
+   * 承接 webview fetch 的事件表
+   */
+  private ipcClientEventMap: IPCClientEventMap = new Map();
+  browserManager: BrowserManager;
+  nextInterceptor: ({ session }: { session: Session }) => () => void;
+
+  constructor() {
+    // load controllers
+    const controllers: IControlModule[] = importAll(
+      // @ts-ignore
+      import.meta.glob('../controllers/*Ctr.ts', { eager: true }),
+    );
+
+    controllers.forEach((service) => this.addController(service));
+
+    // 批量注册 controller 中 event 事件 供 render 端消费
+    this.ipcClientEventMap.forEach((serviceInfo, key) => {
+      // 获取相应方法
+      const { service, methodName } = serviceInfo;
+
+      ipcMain.handle(key, async (e, ...data) => {
+        try {
+          return await service[methodName](...data);
+        } catch (error) {
+          return { error: error.message };
+        }
+      });
+    });
+
+    this.browserManager = new BrowserManager(this);
+  }
+
+  private onActivate = () => {
+    this.browserManager.showMainWindow();
+  };
+
+  bootstrap = async () => {
+    // make single instance
+    const isSingle = app.requestSingleInstanceLock();
+    if (!isSingle) app.exit(0);
+
+    this.initDevBranding();
+
+    //  ==============
+    await initIPCServer();
+
+    // register the schema to interceptor url
+    // it should register before app ready
+    this.registerNextHandler();
+
+    await app.whenReady();
+
+    app.on('ready', async () => {
+      this.initBrowsers();
+    });
+
+    app.on('window-all-closed', () => {
+      if (windows()) {
+        app.quit();
+      }
+    });
+
+    app.on('activate', this.onActivate);
+  };
+
+  private addController = (ControllerClass: IControlModule) => {
+    const service = new ControllerClass(this);
+    this.controllers.set(ControllerClass, service);
+
+    IoCContainer.controllers.get(ControllerClass)?.forEach((event) => {
+      // 将 event 装饰器中的对象全部存到 ipcClientEventMap 中
+      this.ipcClientEventMap.set(event.name, {
+        methodName: event.methodName,
+        service,
+      });
+    });
+  };
+
+  private initDevBranding = () => {
+    if (!isDev) return;
+
+    app.setName('LobeHub Dev');
+    if (macOS()) {
+      app.dock!.setIcon(join(buildDir, 'icon-dev.png'));
+    }
+  };
+
+  /**
+   * 添加窗口
+
+   */
+  private initBrowsers() {
+    Object.values(appBrowsers).forEach((item) => {
+      this.browserManager.retrieveOrInitialize(item);
+    });
+  }
+
+  private registerNextHandler() {
+    if (isDev) return;
+
+    const handler = createHandler({
+      debug: true,
+      localhostUrl: this.nextServerUrl,
+      protocol,
+      standaloneDir: nextStandaloneDir,
+    });
+    console.log(
+      `[APP] Server Debugging Enabled, ${this.nextServerUrl} will be intercepted to ${nextStandaloneDir}`,
+    );
+
+    this.nextInterceptor = handler.createInterceptor;
+  }
+}
@@ -0,0 +1,173 @@
+import { BrowserWindow, BrowserWindowConstructorOptions, ipcMain } from 'electron';
+import { join } from 'node:path';
+
+import { preloadDir, resourcesDir } from '../const/dir';
+import { isDev } from '../const/env';
+import type { App } from './App';
+
+export interface BrowserWindowOpts extends BrowserWindowConstructorOptions {
+  devTools?: boolean;
+  height?: number;
+  /**
+   * URL
+   */
+  identifier: string;
+  keepAlive?: boolean;
+  path: string;
+  title?: string;
+  width?: number;
+}
+
+export default class Browser {
+  private app: App;
+
+  /**
+   * 内部的 electron 窗口
+   */
+  private _browserWindow?: BrowserWindow;
+
+  private stopInterceptHandler;
+  /**
+   * 标识符
+   */
+  identifier: string;
+
+  /**
+   * 生成时的选项
+   */
+  options: BrowserWindowOpts;
+
+  /**
+   * 对外暴露的获取窗口的方法
+   */
+  get browserWindow() {
+    return this.retrieveOrInitialize();
+  }
+
+  /**
+   * 构建 BrowserWindows 对象的方法
+   * @param options
+   * @param application
+   */
+  constructor(options: BrowserWindowOpts, application: App) {
+    this.app = application;
+    this.identifier = options.identifier;
+    this.options = options;
+
+    // 初始化
+    this.retrieveOrInitialize();
+  }
+
+  loadUrl = async (path: string) => {
+    const initUrl = this.app.nextServerUrl + path;
+
+    try {
+      await this._browserWindow.loadURL(initUrl);
+      console.log('[APP] Loaded', initUrl);
+    } catch (error) {
+      console.error('[APP] Failed to load URL:', error);
+
+      // 加载本地错误页面
+      await this._browserWindow.loadFile(join(resourcesDir, 'error.html'));
+
+      // 设置简单的重试逻辑
+      ipcMain.on('retry-connection', async () => {
+        try {
+          await this._browserWindow?.loadURL(initUrl);
+          console.log('[APP] Reconnected successfully');
+        } catch (err) {
+          console.error('[APP] Retry failed:', err);
+          // 重新加载错误页面，重置状态
+          this._browserWindow?.loadFile(join(resourcesDir, 'error.html'));
+        }
+      });
+    }
+  };
+
+  loadPlaceholder = async () => {
+    // 首先加载一个本地的HTML加载页面
+    await this._browserWindow.loadFile(join(resourcesDir, 'splash.html'));
+  };
+
+  show() {
+    this.browserWindow.show();
+  }
+
+  hide() {
+    this.browserWindow.hide();
+  }
+
+  /**
+   * 销毁实例
+   */
+  destroy() {
+    this.stopInterceptHandler?.();
+    this._browserWindow = undefined;
+  }
+
+  /**
+   * 初始化
+   */
+  retrieveOrInitialize() {
+    // 当有这个窗口 且这个窗口没有被注销时
+    if (this._browserWindow && !this._browserWindow.isDestroyed()) {
+      return this._browserWindow;
+    }
+
+    const { path, title, width, height, devTools, ...res } = this.options;
+
+    const browserWindow = new BrowserWindow({
+      ...res,
+      height,
+      show: false,
+      title,
+      webPreferences: {
+        // 上下文隔离环境
+        // https://www.electronjs.org/docs/tutorial/context-isolation
+        contextIsolation: true,
+        preload: join(preloadDir, 'index.js'),
+        // devTools: isDev,
+      },
+      width,
+    });
+
+    this._browserWindow = browserWindow;
+    if (!isDev) {
+      this.stopInterceptHandler = this.app.nextInterceptor({
+        session: browserWindow.webContents.session,
+      });
+    }
+
+    // Windows 11 可以使用这个新 API
+    if (process.platform === 'win32' && browserWindow.setBackgroundMaterial) {
+      browserWindow.setBackgroundMaterial('acrylic');
+    }
+
+    this.loadPlaceholder().then(() => {
+      this.loadUrl(path).catch((e) => {
+        console.error(`load url error, ${path}`, e);
+      });
+    });
+
+    // 显示 devtools 就打开
+    if (devTools) {
+      browserWindow.webContents.openDevTools();
+    }
+
+    browserWindow.once('ready-to-show', () => {
+      browserWindow?.show();
+    });
+
+    browserWindow.on('close', () => {
+      // the ones who need keepAlive won't be destroyed
+      this.stopInterceptHandler();
+      if (this.options.keepAlive) {
+        console.log('needto');
+        // e.preventDefault();
+        // browserWindow.hide();
+      }
+    });
+
+    return browserWindow;
+  }
+}
@@ -0,0 +1,36 @@
+import { chat } from '../appBrowsers';
+import type { App } from './App';
+import type { BrowserWindowOpts } from './Browser';
+import Browser from './Browser';
+
+export default class BrowserManager {
+  app: App;
+
+  browsers: Map<string, Browser | null> = new Map();
+
+  constructor(app: App) {
+    this.app = app;
+  }
+
+  /**
+   * 启动或初始化
+   * @param options
+   */
+  retrieveOrInitialize(options: BrowserWindowOpts) {
+    let browser = this.browsers.get(options.identifier);
+    if (browser) {
+      return browser;
+    }
+
+    browser = new Browser(options, this.app);
+
+    this.browsers.set(options.identifier, browser);
+
+    return browser;
+  }
+
+  showMainWindow() {
+    const window = this.retrieveOrInitialize(chat);
+    window.show();
+  }
+}
@@ -0,0 +1,11 @@
+import { ElectronIPCServer } from '@lobechat/electron-server-ipc';
+
+import { ipcEvent } from '../ipcServer';
+
+const ipcServer = new ElectronIPCServer(ipcEvent);
+
+export const initIPCServer = async (): Promise<ElectronIPCServer> => {
+  await ipcServer.start();
+
+  return ipcServer;
+};
@@ -0,0 +1,9 @@
+/**
+ * 存储插件中的 service
+ */
+export class IoCContainer {
+  static controllers: WeakMap<any, { methodName: string; name: string; showLog?: boolean }[]> =
+    new WeakMap();
+
+  init() {}
+}
@@ -0,0 +1,5 @@
+import { App } from './core/App';
+
+const app = new App();
+
+app.bootstrap();
@@ -0,0 +1,29 @@
+import { IpcDispatchEvent } from '@lobechat/electron-server-ipc';
+import { app } from 'electron';
+import { readFileSync, writeFileSync } from 'node:fs';
+import path from 'node:path';
+
+const userDataPath = app.getPath('userData');
+
+const DB_SCHEMA_HASH_PATH = path.join(userDataPath, 'lobehub-local-db-schema-hash');
+
+export const ipcEvent: IpcDispatchEvent = {
+  getDatabasePath: async () => {
+    return path.join(userDataPath, 'lobehub-local-db');
+  },
+  getDatabaseSchemaHash: async () => {
+    try {
+      return readFileSync(DB_SCHEMA_HASH_PATH, 'utf8');
+    } catch {
+      return undefined;
+    }
+  },
+
+  getUserDataPath: async () => {
+    return userDataPath;
+  },
+
+  setDatabaseSchemaHash: async (hash: string) => {
+    writeFileSync(DB_SCHEMA_HASH_PATH, hash, 'utf8');
+  },
+};
@@ -0,0 +1,46 @@
+import { electronAPI } from '@electron-toolkit/preload';
+import { ClientDispatchEventKey, DispatchInvoke } from '@lobechat/electron-client-ipc';
+import { contextBridge, ipcRenderer } from 'electron';
+
+// Custom APIs for renderer
+const api = {};
+
+// 添加 IPC 通信接口
+const ipcApi = {
+  receive: (channel: string, callback: (...args: any[]) => void) => {
+    // 包装回调函数，确保安全性
+    const subscription = (_event: any, ...args: any[]) => callback(...args);
+    ipcRenderer.on(channel, subscription);
+
+    // 返回取消订阅的函数
+    return () => {
+      ipcRenderer.removeListener(channel, subscription);
+    };
+  },
+  send: (channel: string, ...args: any[]) => {
+    console.log('channel', channel);
+    ipcRenderer.send(channel, ...args);
+  },
+};
+
+// Use `contextBridge` APIs to expose Electron APIs to
+// renderer only if context isolation is enabled, otherwise
+// just add to the DOM global.
+
+try {
+  contextBridge.exposeInMainWorld('api', api);
+  contextBridge.exposeInMainWorld('electron', {
+    ...electronAPI,
+    ipcRenderer: ipcApi,
+  });
+} catch (error) {
+  console.error(error);
+}
+
+/**
+ * client 端请求 electron main 端方法
+ */
+const invoke: DispatchInvoke = async <T extends ClientDispatchEventKey>(event: T, ...data: any[]) =>
+  ipcRenderer.invoke(event, ...data);
+
+contextBridge.exposeInMainWorld('electronAPI', { invoke });
@@ -0,0 +1,19 @@
+{
+  "compilerOptions": {
+    "allowJs": true,
+    "skipLibCheck": true,
+    "forceConsistentCasingInFileNames": true,
+    "noEmit": true,
+    "target": "ESNext",
+    "esModuleInterop": true,
+    "emitDecoratorMetadata": true,
+    "experimentalDecorators": true,
+    "module": "esnext",
+    "moduleResolution": "bundler",
+    "resolveJsonModule": true,
+    "isolatedModules": true,
+    "incremental": true,
+    "baseUrl": "."
+  },
+  "include": ["src/main/**/*", "src/preload/**/*", "electron-builder.js"]
+}
@@ -1,4 +1,370 @@
 [
+  {
+    "children": {
+      "improvements": ["Refactor the db to context inject mode."]
+    },
+    "date": "2025-04-01",
+    "version": "1.77.6"
+  },
+  {
+    "children": {},
+    "date": "2025-04-01",
+    "version": "1.77.5"
+  },
+  {
+    "children": {
+      "improvements": ["Update branding."]
+    },
+    "date": "2025-03-31",
+    "version": "1.77.4"
+  },
+  {
+    "children": {
+      "improvements": ["Move general db models to database folder."]
+    },
+    "date": "2025-03-29",
+    "version": "1.77.3"
+  },
+  {
+    "children": {
+      "fixes": ["Fix decrypt error with imported pg data."]
+    },
+    "date": "2025-03-29",
+    "version": "1.77.2"
+  },
+  {
+    "children": {
+      "fixes": ["Fix export button and clean orphan agent."]
+    },
+    "date": "2025-03-29",
+    "version": "1.77.1"
+  },
+  {
+    "children": {
+      "features": ["Support pglite and postgres data export."]
+    },
+    "date": "2025-03-29",
+    "version": "1.77.0"
+  },
+  {
+    "children": {
+      "improvements": ["Supports OpenAI's latest voice model gpt-4o-mini-tts."]
+    },
+    "date": "2025-03-29",
+    "version": "1.76.1"
+  },
+  {
+    "children": {
+      "features": ["Add Hotkey Settings."]
+    },
+    "date": "2025-03-28",
+    "version": "1.76.0"
+  },
+  {
+    "children": {
+      "improvements": [
+        "Add tencentcloud deepseek-v3-0324, support for parsing imageOutput, update models for siliconcloud & infiniai."
+      ]
+    },
+    "date": "2025-03-28",
+    "version": "1.75.5"
+  },
+  {
+    "children": {
+      "improvements": ["Update models info."]
+    },
+    "date": "2025-03-27",
+    "version": "1.75.4"
+  },
+  {
+    "children": {
+      "fixes": ["Fix anthropic import issue."]
+    },
+    "date": "2025-03-26",
+    "version": "1.75.3"
+  },
+  {
+    "children": {
+      "fixes": ["Update 'gemini-2.5-pro-exp-03-25' maxOutput and contextWindowTokens."]
+    },
+    "date": "2025-03-26",
+    "version": "1.75.2"
+  },
+  {
+    "children": {
+      "improvements": ["Update siliconcloud models."]
+    },
+    "date": "2025-03-26",
+    "version": "1.75.1"
+  },
+  {
+    "children": {
+      "features": [
+        "Add reasoning content selector and update AutoScroll component, add Xinference provider support."
+      ],
+      "improvements": ["Add Gemini 2.5 Pro Experimental model, improve editing scroll experience."]
+    },
+    "date": "2025-03-26",
+    "version": "1.75.0"
+  },
+  {
+    "children": {
+      "improvements": ["Upgrade styles for Drawer."]
+    },
+    "date": "2025-03-25",
+    "version": "1.74.11"
+  },
+  {
+    "children": {
+      "improvements": ["Add hunyuan-t1-latest from Hunyuan."]
+    },
+    "date": "2025-03-25",
+    "version": "1.74.10"
+  },
+  {
+    "children": {
+      "improvements": ["Add reject pattern for browserless to boost crawl performance."]
+    },
+    "date": "2025-03-25",
+    "version": "1.74.9"
+  },
+  {
+    "children": {
+      "fixes": ["Update create message loading issue."]
+    },
+    "date": "2025-03-24",
+    "version": "1.74.8"
+  },
+  {
+    "children": {
+      "fixes": ["Remove Tooltip component in Topic in mobile mode."]
+    },
+    "date": "2025-03-24",
+    "version": "1.74.7"
+  },
+  {
+    "children": {
+      "fixes": ["Set max_completion_tokens to undefined for Azure OpenAI."]
+    },
+    "date": "2025-03-24",
+    "version": "1.74.6"
+  },
+  {
+    "children": {
+      "fixes": ["Fix wechat login error with next-auth."]
+    },
+    "date": "2025-03-23",
+    "version": "1.74.5"
+  },
+  {
+    "children": {
+      "fixes": ["Upgrade next to 15.2.3 to fix CVE-2025-29927."]
+    },
+    "date": "2025-03-23",
+    "version": "1.74.4"
+  },
+  {
+    "children": {
+      "improvements": ["Clear previous model check result."]
+    },
+    "date": "2025-03-22",
+    "version": "1.74.3"
+  },
+  {
+    "children": {
+      "fixes": ["CheckModel change clears other configs, update input and output prices."]
+    },
+    "date": "2025-03-22",
+    "version": "1.74.2"
+  },
+  {
+    "children": {
+      "improvements": ["Fix deepseek-r1-70b-online search tag missing from Search1API."]
+    },
+    "date": "2025-03-22",
+    "version": "1.74.1"
+  },
+  {
+    "children": {
+      "features": [
+        "Add infini-ai provider, add Search1API provider with web search DeepSeek models."
+      ]
+    },
+    "date": "2025-03-21",
+    "version": "1.74.0"
+  },
+  {
+    "children": {
+      "fixes": ["Fix agent chatConfig override issue."]
+    },
+    "date": "2025-03-21",
+    "version": "1.73.2"
+  },
+  {
+    "children": {
+      "improvements": ["Update shiki to v3."]
+    },
+    "date": "2025-03-21",
+    "version": "1.73.1"
+  },
+  {
+    "children": {
+      "features": [
+        "Add Cohere provider support, add search1api crawler implementation for WeChat Sogou links."
+      ]
+    },
+    "date": "2025-03-19",
+    "version": "1.73.0"
+  },
+  {
+    "children": {
+      "fixes": ["Allow historyCount to be set to 0."]
+    },
+    "date": "2025-03-19",
+    "version": "1.72.1"
+  },
+  {
+    "children": {
+      "features": ["Update db schema to add user_id for data export."]
+    },
+    "date": "2025-03-18",
+    "version": "1.72.0"
+  },
+  {
+    "children": {
+      "improvements": ["Support screenshot to clipboard when sharing."]
+    },
+    "date": "2025-03-17",
+    "version": "1.71.5"
+  },
+  {
+    "children": {
+      "improvements": ["Update Wenxin & Hunyuan model list."]
+    },
+    "date": "2025-03-17",
+    "version": "1.71.4"
+  },
+  {
+    "children": {
+      "fixes": ["Fix claude 3.5+ models context max output."]
+    },
+    "date": "2025-03-15",
+    "version": "1.71.3"
+  },
+  {
+    "children": {
+      "fixes": ["Fix knowledge base issue."]
+    },
+    "date": "2025-03-15",
+    "version": "1.71.2"
+  },
+  {
+    "children": {
+      "fixes": ["Fix google gemini output relative issue."],
+      "improvements": ["Update Vertex AI models."]
+    },
+    "date": "2025-03-15",
+    "version": "1.71.1"
+  },
+  {
+    "children": {
+      "features": ["Support gemini image output in chat."]
+    },
+    "date": "2025-03-14",
+    "version": "1.71.0"
+  },
+  {
+    "children": {},
+    "date": "2025-03-13",
+    "version": "1.70.11"
+  },
+  {
+    "children": {
+      "fixes": ["The agent setting -edit_agent not work."]
+    },
+    "date": "2025-03-12",
+    "version": "1.70.10"
+  },
+  {
+    "children": {},
+    "date": "2025-03-12",
+    "version": "1.70.9"
+  },
+  {
+    "children": {
+      "fixes": ["Fix theme flicking."]
+    },
+    "date": "2025-03-12",
+    "version": "1.70.8"
+  },
+  {
+    "children": {
+      "fixes": ["Fix crawl result for short content."]
+    },
+    "date": "2025-03-12",
+    "version": "1.70.7"
+  },
+  {
+    "children": {
+      "fixes": ["Link jump in mobile terminal data statistics."]
+    },
+    "date": "2025-03-11",
+    "version": "1.70.6"
+  },
+  {
+    "children": {
+      "fixes": ["Refactor the theme implement."]
+    },
+    "date": "2025-03-11",
+    "version": "1.70.5"
+  },
+  {
+    "children": {
+      "improvements": ["Support OpenRouter custom BaseURL."]
+    },
+    "date": "2025-03-11",
+    "version": "1.70.4"
+  },
+  {
+    "children": {},
+    "date": "2025-03-11",
+    "version": "1.70.3"
+  },
+  {
+    "children": {
+      "fixes": ["Update cvpr cvf url rules."]
+    },
+    "date": "2025-03-10",
+    "version": "1.70.2"
+  },
+  {
+    "children": {
+      "fixes": ["Fix anthropic max tokens."]
+    },
+    "date": "2025-03-10",
+    "version": "1.70.1"
+  },
+  {
+    "children": {
+      "features": ["Support no-fc models like deepseek r1 with online search."]
+    },
+    "date": "2025-03-09",
+    "version": "1.70.0"
+  },
+  {
+    "children": {
+      "fixes": ["Fix context cache control and model builtin search switch."]
+    },
+    "date": "2025-03-09",
+    "version": "1.69.6"
+  },
+  {
+    "children": {
+      "improvements": ["Support openrouter claude 3.7 sonnet reasoning."]
+    },
+    "date": "2025-03-09",
+    "version": "1.69.5"
+  },
  {
    "children": {
      "fixes": ["Fix mistral can not chat."]
@@ -0,0 +1,638 @@
+table agents {
+  id text [pk, not null]
+  slug varchar(100) [unique]
+  title text
+  description text
+  tags jsonb [default: `[]`]
+  avatar text
+  background_color text
+  plugins jsonb [default: `[]`]
+  client_id text
+  user_id text [not null]
+  chat_config jsonb
+  few_shots jsonb
+  model text
+  params jsonb [default: `{}`]
+  provider text
+  system_role text
+  tts jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'client_id_user_id_unique', unique]
+  }
+}
+
+table agents_files {
+  file_id text [not null]
+  agent_id text [not null]
+  enabled boolean [default: true]
+  user_id text [not null]
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (file_id, agent_id, user_id) [pk]
+  }
+}
+
+table agents_knowledge_bases {
+  agent_id text [not null]
+  knowledge_base_id text [not null]
+  user_id text [not null]
+  enabled boolean [default: true]
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (agent_id, knowledge_base_id) [pk]
+  }
+}
+
+table ai_models {
+  id varchar(150) [not null]
+  display_name varchar(200)
+  description text
+  organization varchar(100)
+  enabled boolean
+  provider_id varchar(64) [not null]
+  type varchar(20) [not null, default: 'chat']
+  sort integer
+  user_id text [not null]
+  pricing jsonb
+  parameters jsonb [default: `{}`]
+  config jsonb
+  abilities jsonb [default: `{}`]
+  context_window_tokens integer
+  source varchar(20)
+  released_at varchar(10)
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (id, provider_id, user_id) [pk]
+  }
+}
+
+table ai_providers {
+  id varchar(64) [not null]
+  name text
+  user_id text [not null]
+  sort integer
+  enabled boolean
+  fetch_on_client boolean
+  check_model text
+  logo text
+  description text
+  key_vaults text
+  source varchar(20)
+  settings jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (id, user_id) [pk]
+  }
+}
+
+table async_tasks {
+  id uuid [pk, not null, default: `gen_random_uuid()`]
+  type text
+  status text
+  error jsonb
+  user_id text [not null]
+  duration integer
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table files {
+  id text [pk, not null]
+  user_id text [not null]
+  file_type varchar(255) [not null]
+  file_hash varchar(64)
+  name text [not null]
+  size integer [not null]
+  url text [not null]
+  client_id text
+  metadata jsonb
+  chunk_task_id uuid
+  embedding_task_id uuid
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    file_hash [name: 'file_hash_idx']
+    (client_id, user_id) [name: 'files_client_id_user_id_unique', unique]
+  }
+}
+
+table global_files {
+  hash_id varchar(64) [pk, not null]
+  file_type varchar(255) [not null]
+  size integer [not null]
+  url text [not null]
+  metadata jsonb
+  creator text [not null]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table knowledge_base_files {
+  knowledge_base_id text [not null]
+  file_id text [not null]
+  user_id text [not null]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (knowledge_base_id, file_id) [pk]
+  }
+}
+
+table knowledge_bases {
+  id text [pk, not null]
+  name text [not null]
+  description text
+  avatar text
+  type text
+  user_id text [not null]
+  client_id text
+  is_public boolean [default: false]
+  settings jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'knowledge_bases_client_id_user_id_unique', unique]
+  }
+}
+
+table message_chunks {
+  message_id text
+  chunk_id uuid
+  user_id text [not null]
+
+  indexes {
+    (chunk_id, message_id) [pk]
+  }
+}
+
+table message_plugins {
+  id text [pk, not null]
+  tool_call_id text
+  type text [default: 'default']
+  api_name text
+  arguments text
+  identifier text
+  state jsonb
+  error jsonb
+  client_id text
+  user_id text [not null]
+
+  indexes {
+    (client_id, user_id) [name: 'message_plugins_client_id_user_id_unique', unique]
+  }
+}
+
+table message_queries {
+  id uuid [pk, not null, default: `gen_random_uuid()`]
+  message_id text [not null]
+  rewrite_query text
+  user_query text
+  client_id text
+  user_id text [not null]
+  embeddings_id uuid
+
+  indexes {
+    (client_id, user_id) [name: 'message_queries_client_id_user_id_unique', unique]
+  }
+}
+
+table message_query_chunks {
+  id text
+  query_id uuid
+  chunk_id uuid
+  similarity "numeric(6, 5)"
+  user_id text [not null]
+
+  indexes {
+    (chunk_id, id, query_id) [pk]
+  }
+}
+
+table message_tts {
+  id text [pk, not null]
+  content_md5 text
+  file_id text
+  voice text
+  client_id text
+  user_id text [not null]
+
+  indexes {
+    (client_id, user_id) [name: 'message_tts_client_id_user_id_unique', unique]
+  }
+}
+
+table message_translates {
+  id text [pk, not null]
+  content text
+  from text
+  to text
+  client_id text
+  user_id text [not null]
+
+  indexes {
+    (client_id, user_id) [name: 'message_translates_client_id_user_id_unique', unique]
+  }
+}
+
+table messages {
+  id text [pk, not null]
+  role text [not null]
+  content text
+  reasoning jsonb
+  search jsonb
+  metadata jsonb
+  model text
+  provider text
+  favorite boolean [default: false]
+  error jsonb
+  tools jsonb
+  trace_id text
+  observation_id text
+  client_id text
+  user_id text [not null]
+  session_id text
+  topic_id text
+  thread_id text
+  parent_id text
+  quota_id text
+  agent_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    created_at [name: 'messages_created_at_idx']
+    (client_id, user_id) [name: 'message_client_id_user_unique', unique]
+    topic_id [name: 'messages_topic_id_idx']
+    parent_id [name: 'messages_parent_id_idx']
+    quota_id [name: 'messages_quota_id_idx']
+  }
+}
+
+table messages_files {
+  file_id text [not null]
+  message_id text [not null]
+  user_id text [not null]
+
+  indexes {
+    (file_id, message_id) [pk]
+  }
+}
+
+table nextauth_accounts {
+  access_token text
+  expires_at integer
+  id_token text
+  provider text [not null]
+  providerAccountId text [not null]
+  refresh_token text
+  scope text
+  session_state text
+  token_type text
+  type text [not null]
+  userId text [not null]
+
+  indexes {
+    (provider, providerAccountId) [pk]
+  }
+}
+
+table nextauth_authenticators {
+  counter integer [not null]
+  credentialBackedUp boolean [not null]
+  credentialDeviceType text [not null]
+  credentialID text [not null, unique]
+  credentialPublicKey text [not null]
+  providerAccountId text [not null]
+  transports text
+  userId text [not null]
+
+  indexes {
+    (userId, credentialID) [pk]
+  }
+}
+
+table nextauth_sessions {
+  expires timestamp [not null]
+  sessionToken text [pk, not null]
+  userId text [not null]
+}
+
+table nextauth_verificationtokens {
+  expires timestamp [not null]
+  identifier text [not null]
+  token text [not null]
+
+  indexes {
+    (identifier, token) [pk]
+  }
+}
+
+table chunks {
+  id uuid [pk, not null, default: `gen_random_uuid()`]
+  text text
+  abstract text
+  metadata jsonb
+  index integer
+  type varchar
+  client_id text
+  user_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'chunks_client_id_user_id_unique', unique]
+  }
+}
+
+table embeddings {
+  id uuid [pk, not null, default: `gen_random_uuid()`]
+  chunk_id uuid [unique]
+  embeddings vector(1024)
+  model text
+  client_id text
+  user_id text
+
+  indexes {
+    (client_id, user_id) [name: 'embeddings_client_id_user_id_unique', unique]
+  }
+}
+
+table unstructured_chunks {
+  id uuid [pk, not null, default: `gen_random_uuid()`]
+  text text
+  metadata jsonb
+  index integer
+  type varchar
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+  parent_id varchar
+  composite_id uuid
+  client_id text
+  user_id text
+  file_id varchar
+
+  indexes {
+    (client_id, user_id) [name: 'unstructured_chunks_client_id_user_id_unique', unique]
+  }
+}
+
+table rag_eval_dataset_records {
+  id integer [pk, not null]
+  dataset_id integer [not null]
+  ideal text
+  question text
+  reference_files text[]
+  metadata jsonb
+  user_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table rag_eval_datasets {
+  id integer [pk, not null]
+  description text
+  name text [not null]
+  knowledge_base_id text
+  user_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table rag_eval_evaluations {
+  id integer [pk, not null]
+  name text [not null]
+  description text
+  eval_records_url text
+  status text
+  error jsonb
+  dataset_id integer [not null]
+  knowledge_base_id text
+  language_model text
+  embedding_model text
+  user_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table rag_eval_evaluation_records {
+  id integer [pk, not null]
+  question text [not null]
+  answer text
+  context text[]
+  ideal text
+  status text
+  error jsonb
+  language_model text
+  embedding_model text
+  question_embedding_id uuid
+  duration integer
+  dataset_record_id integer [not null]
+  evaluation_id integer [not null]
+  user_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+table agents_to_sessions {
+  agent_id text [not null]
+  session_id text [not null]
+  user_id text [not null]
+
+  indexes {
+    (agent_id, session_id) [pk]
+  }
+}
+
+table file_chunks {
+  file_id varchar
+  chunk_id uuid
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  user_id text [not null]
+
+  indexes {
+    (file_id, chunk_id) [pk]
+  }
+}
+
+table files_to_sessions {
+  file_id text [not null]
+  session_id text [not null]
+  user_id text [not null]
+
+  indexes {
+    (file_id, session_id) [pk]
+  }
+}
+
+table session_groups {
+  id text [pk, not null]
+  name text [not null]
+  sort integer
+  user_id text [not null]
+  client_id text
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'session_groups_client_id_user_id_unique', unique]
+  }
+}
+
+table sessions {
+  id text [pk, not null]
+  slug varchar(100) [not null]
+  title text
+  description text
+  avatar text
+  background_color text
+  type text [default: 'agent']
+  user_id text [not null]
+  group_id text
+  client_id text
+  pinned boolean [default: false]
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (slug, user_id) [name: 'slug_user_id_unique', unique]
+    (client_id, user_id) [name: 'sessions_client_id_user_id_unique', unique]
+  }
+}
+
+table threads {
+  id text [pk, not null]
+  title text
+  type text [not null]
+  status text [default: 'active']
+  topic_id text [not null]
+  source_message_id text [not null]
+  parent_thread_id text
+  client_id text
+  user_id text [not null]
+  last_active_at "timestamp with time zone" [default: `now()`]
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'threads_client_id_user_id_unique', unique]
+  }
+}
+
+table topics {
+  id text [pk, not null]
+  title text
+  favorite boolean [default: false]
+  session_id text
+  user_id text [not null]
+  client_id text
+  history_summary text
+  metadata jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (client_id, user_id) [name: 'topics_client_id_user_id_unique', unique]
+  }
+}
+
+table user_installed_plugins {
+  user_id text [not null]
+  identifier text [not null]
+  type text [not null]
+  manifest jsonb
+  settings jsonb
+  custom_params jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+
+  indexes {
+    (user_id, identifier) [pk]
+  }
+}
+
+table user_settings {
+  id text [pk, not null]
+  tts jsonb
+  hotkey jsonb
+  key_vaults text
+  general jsonb
+  language_model jsonb
+  system_agent jsonb
+  default_agent jsonb
+  tool jsonb
+}
+
+table users {
+  id text [pk, not null]
+  username text [unique]
+  email text
+  avatar text
+  phone text
+  first_name text
+  last_name text
+  full_name text
+  is_onboarded boolean [default: false]
+  clerk_created_at "timestamp with time zone"
+  email_verified_at "timestamp with time zone"
+  preference jsonb
+  accessed_at "timestamp with time zone" [not null, default: `now()`]
+  created_at "timestamp with time zone" [not null, default: `now()`]
+  updated_at "timestamp with time zone" [not null, default: `now()`]
+}
+
+ref: agents_knowledge_bases.knowledge_base_id - knowledge_bases.id
+
+ref: agents_knowledge_bases.agent_id > agents.id
+
+ref: agents_to_sessions.session_id > sessions.id
+
+ref: agents_to_sessions.agent_id > agents.id
+
+ref: unstructured_chunks.file_id - files.id
+
+ref: files.embedding_task_id - async_tasks.id
+
+ref: messages.session_id - sessions.id
+
+ref: messages.parent_id - messages.id
+
+ref: messages.topic_id - topics.id
+
+ref: threads.source_message_id - messages.id
+
+ref: sessions.group_id - session_groups.id
+
+ref: topics.session_id - sessions.id
@@ -36,7 +36,7 @@ tags:

  <Image alt={'Clerk 添加 Webhooks 端点'} src={'https://github.com/lobehub/lobe-chat/assets/28616219/f50f47fb-5e8e-4930-bf4e-8cf6f5b8afb9'} />

-  在 endppint 中填写你的项目 URL，如 `https://your-project.com/api/webhooks/clerk`。然后在订阅事件（Subscribe to events）中，勾选 user 的三个事件（`user.created` 、`user.deleted`、`user.updated`），然后点击创建。
+  在 endpoint 中填写你的项目 URL，如 `https://your-project.com/api/webhooks/clerk`。然后在订阅事件（Subscribe to events）中，勾选 user 的三个事件（`user.created` 、`user.deleted`、`user.updated`），然后点击创建。

  <Callout type={'warning'}>URL 的`https://`不可缺失，须保持 URL 的完整性</Callout>

@@ -14,10 +14,10 @@ tags:

 LobeChat supports customizing the model list during deployment. This configuration is done in the environment for each [model provider](/docs/self-hosting/environment-variables/model-provider).

-You can use `+` to add a model, `-` to hide a model, and use `model name=display name<extension configuration>` to customize the display name of a model, separated by English commas. The basic syntax is as follows:
+You can use `+` to add a model, `-` to hide a model, and use `model name->deploymentName=display name<extension configuration>` to customize the display name of a model, separated by English commas. The basic syntax is as follows:

 ```text
-id=displayName<maxToken:vision:reasoning:search:fc:file>,model2,model3
+id->deploymentName=displayName<maxToken:vision:reasoning:search:fc:file:imageOutput>,model2,model3
 ```

 For example: `+qwen-7b-chat,+glm-6b,-gpt-3.5-turbo,gpt-4-0125-preview=gpt-4-turbo`
@@ -29,7 +29,7 @@ In the above example, it adds `qwen-7b-chat` and `glm-6b` to the model list, rem
 Considering the diversity of model capabilities, we started to add extension configuration in version `0.147.8`, with the following rules:

 ```shell
-id=displayName<maxToken:vision:reasoning:search:fc:file>
+id->deploymentName=displayName<maxToken:vision:reasoning:search:fc:file:imageOutput>
 ```

 The first value in angle brackets is designated as the `maxToken` for this model. The second value and beyond are the model's extension capabilities, separated by colons `:`, and the order is not important.
@@ -41,7 +41,8 @@ Examples are as follows:
 - `gemini-1.5-flash-latest=Gemini 1.5 Flash<16000:vision>`: Google Vision model, maximum context of 16k, supports image recognition;
 - `o3-mini=OpenAI o3-mini<200000:reasoning:fc>`: OpenAI o3-mini model, maximum context of 200k, supports reasoning and Function Call;
 - `qwen-max-latest=Qwen Max<32768:search:fc>`: Qwen 2.5 Max model, maximum context of 32k, supports web search and Function Call;
- `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`, hacked version of ChatGPT Plus web, context of 128k, supports image recognition, Function Call, file upload.
+- `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`, hacked version of ChatGPT Plus web, context of 128k, supports image recognition, Function Call, file upload;
+- `gemini-2.0-flash-exp-image-generation=Gemini 2.0 Flash (Image Generation) Experimental<32768:imageOutput:vision>`, Gemini 2.0 Flash Experimental model for image generation, maximum context of 32k, supports image generation and recognition.

 Currently supported extension capabilities are:

@@ -49,6 +50,7 @@ Currently supported extension capabilities are:
 | ----------- | -------------------------------------------------------- |
 | `fc`        | Function Calling                                         |
 | `vision`    | Image Recognition                                        |
+| `imageOutput`    | Image Generation                                        |
 | `reasoning` | Support Reasoning                                        |
 | `search`    | Support Web Search                                        |
 | `file`      | File Upload (a bit hacky, not recommended for daily use) |
@@ -13,10 +13,10 @@ tags:

 LobeChat 支持在部署时自定义模型列表，详情请参考 [模型提供商](/zh/docs/self-hosting/environment-variables/model-provider) 。

-你可以使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。通过 `<>` 来添加扩展配置。基本语法如下：
+你可以使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名->部署名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。通过 `<>` 来添加扩展配置。基本语法如下：

 ```text
-id=displayName<maxToken:vision:reasoning:search:fc:file>,model2,model3
+id->deploymentName=displayName<maxToken:vision:reasoning:search:fc:file:imageOutput>,model2,model3
 ```

 例如： `+qwen-7b-chat,+glm-6b,-gpt-3.5-turbo,gpt-4-0125-preview=gpt-4-turbo`
@@ -28,7 +28,7 @@ id=displayName<maxToken:vision:reasoning:search:fc:file>,model2,model3
 考虑到模型的能力多样性，我们在 `0.147.8` 版本开始增加扩展性配置，它的规则如下：

 ```shell
-id=displayName<maxToken:vision:reasoning:search:fc:file>
+id->deploymentName=displayName<maxToken:vision:reasoning:search:fc:file:imageOutput>
 ```

 尖括号第一个值约定为这个模型的 `maxToken` 。第二个及以后作为模型的扩展能力，能力与能力之间用冒号 `:` 作为分隔符，顺序不重要。
@@ -40,7 +40,8 @@ id=displayName<maxToken:vision:reasoning:search:fc:file>
 - `gemini-1.5-flash-latest=Gemini 1.5 Flash<16000:vision>`：Google 视觉模型，最大上下文 16k，支持图像识别；
 - `o3-mini=OpenAI o3-mini<200000:reasoning:fc>`：OpenAI o3-mini 模型，最大上下文 200k，支持推理及 Function Call；
 - `qwen-max-latest=Qwen Max<32768:search:fc>`：通义千问 2.5 Max 模型，最大上下文 32k，支持联网搜索及 Function Call；
- `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`，hack 的 ChatGPT Plus 网页版，上下 128k ，支持图像识别、Function Call、文件上传
+- `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`，hack 的 ChatGPT Plus 网页版，上下 128k ，支持图像识别、Function Call、文件上传；
+- `gemini-2.0-flash-exp-image-generation=Gemini 2.0 Flash (Image Generation) Experimental<32768:imageOutput:vision>`，Gemini 2.0 Flash 实验模型，最大上下文 32k，支持图像生成和识别

 目前支持的扩展能力有：

@@ -48,6 +49,7 @@ id=displayName<maxToken:vision:reasoning:search:fc:file>
 | ----------- | ---------------------- |
 | `fc`        | 函数调用（function calling） |
 | `vision`    | 视觉识别                   |
+| `imageOutput`      | 图像生成  |
 | `reasoning` | 支持推理                   |
 | `search`    | 支持联网搜索                   |
 | `file`      | 文件上传（比较 hack，不建议日常使用）  |
@@ -94,7 +94,7 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 ### `AZURE_MODEL_LIST`

 - Type: Optional
- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `id->deplymentName=displayName` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
+- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `id->deploymentName=displayName` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
 - Default: `-`
 - Example: `gpt-35-turbo->my-deploy=GPT 3.5 Turbo` 或 `gpt-4-turbo->my-gpt4=GPT 4 Turbo<128000:vision:fc>`

@@ -173,8 +173,8 @@ If you need to use Azure OpenAI to provide model services, you can refer to the

 - Type: Optional
 - Description: If you manually configure the DeepSeek API proxy, you can use this configuration item to override the default DeepSeek API request base URL
- Default: -
- Example: `https://xxxx.models.ai.azure.com/v1`
+- Default: `https://api.deepseek.com`
+- Example: `https://my-deepseek-proxy.com`

 ### `DEEPSEEK_API_KEY`

@@ -183,6 +183,13 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 - Default: -
 - Example: `sk-xxxxxx...xxxxxx`

+### `DEEPSEEK_MODEL_LIST`
+
+- Type: Optional
+- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `model_name=displayName` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
+- Default: `-`
+- Example: `-all,+deepseek-reasoner`
+
 ## XAI

 ### `XAI_API_KEY`
@@ -313,6 +320,13 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 - Default: -
 - Example: `Y2xpdGhpMzNhZXNoYjVtdnZjMWc6bXNrLWIxQlk3aDNPaXpBWnc0V1RaMDhSRmRFVlpZUWY=`

+### `MOONSHOT_PROXY_URL`
+
+- Type: Optional
+- Description: If you manually configure the Moonshot API proxy, you can use this configuration item to override the default Moonshot API request base URL
+- Default: `https://api.moonshot.cn/v1`
+- Example: `https://my-moonshot-proxy.com/v1`
+
 ## Perplexity AI

 ### `PERPLEXITY_API_KEY`
@@ -425,6 +439,13 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 - Default: `-`
 - Example: `-all,+qwen-turbo-latest,+qwen-plus-latest`

+### `QWEN_PROXY_URL`
+
+- Type: Optional
+- Description: If you manually configure the Qwen API proxy, you can use this configuration item to override the default Qwen API request base URL
+- Default: `https://dashscope.aliyuncs.com/compatible-mode/v1`
+- Example: `https://my-qwen-proxy.com/v1`
+
 ## Stepfun AI

 ### `STEPFUN_API_KEY`
@@ -555,9 +576,31 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 ### `VOLCENGINE_MODEL_LIST`

 - Type: Optional
- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `model_name=display_name` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
+- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `model_name->deploymentName=display_name` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
 - Default: `-`
- Example: `-all,+deepseek-r1-250120,+deepseek-v3-241226,+doubao-1-5-pro-256k-250115,+doubao-1-5-pro-32k-250115,+doubao-1-5-lite-32k-250115`
+- Example: `-all,+deepseek-r1->deepseek-r1-250120,+deepseek-v3->deepseek-v3-250324,+doubao-1.5-pro-256k->doubao-1-5-pro-256k-250115,+doubao-1.5-pro-32k->doubao-1-5-pro-32k-250115,+doubao-1.5-lite-32k->doubao-1-5-lite-32k-250115`

+### `VOLCENGINE_PROXY_URL`
+
+- Type: Optional
+- Description: If you manually configure the Volcengine API proxy, you can use this configuration item to override the default Volcengine API request base URL
+- Default: `https://ark.cn-beijing.volces.com/api/v3`
+- Example: `https://my-volcengine-proxy.com/v1`
+
+## InfiniAI
+
+### `INFINIAI_API_KEY`
+
+- Type: Required
+- Description: This is the API key you applied from Infini-AI, you can check it out [here](https://cloud.infini-ai.com)
+- Default: -
+- Example: `sk-xxxxxx...xxxxxx`
+
+### `INFINIAI_MODEL_LIST`
+
+- Type: Optional
+- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `model_name->deploymentName=display_name` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
+- Default: `-`
+- Example: `-all,+qwq-32b,+deepseek-r1`

 [model-list]: /docs/self-hosting/advanced/model-list
@@ -171,8 +171,8 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，

 - 类型：可选
 - 描述：如果您手动配置了 DeepSeek API 代理，可以使用此配置项覆盖默认的 DeepSeek API 请求基础 URL
- 默认值: -
- 示例: `https://xxxx.models.ai.azure.com/v1`
+- 默认值：`https://api.deepseek.com`
+- 示例：`https://my-deepseek-proxy.com`

 ### `DEEPSEEK_API_KEY`

@@ -181,6 +181,13 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，
 - 默认值：-
 - 示例：`sk-xxxxxx...xxxxxx`

+### `DEEPSEEK_MODEL_LIST`
+
+- 类型：可选
+- 描述：用来控制模型列表，使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。模型定义语法规则见 [模型列表][model-list]
+- 默认值：`-`
+- 示例：`-all,+deepseek-reasoner`
+
 ## XAI

 ### `XAI_API_KEY`
@@ -311,6 +318,14 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，
 - 默认值：-
 - 示例：`Y2xpdGhpMzNhZXNoYjVtdnZjMWc6bXNrLWIxQlk3aDNPaXpBWnc0V1RaMDhSRmRFVlpZUWY=`

+### `MOONSHOT_PROXY_URL`
+
+- 类型：可选
+- 描述：如果你手动配置了 Moonshot 接口代理，可以使用此配置项来覆盖默认的 Moonshot API 请求基础 URL
+- 默认值：`https://api.moonshot.cn/v1`
+- 示例：`https://my-moonshot-proxy.com/v1`
+
+
 ## Perplexity AI

 ### `PERPLEXITY_API_KEY`
@@ -423,6 +438,13 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，
 - 默认值：`-`
 - 示例：`-all,+qwen-turbo-latest,+qwen-plus-latest`

+### `QWEN_PROXY_URL`
+
+- 类型：可选
+- 描述：如果你手动配置了 Qwen 接口代理，可以使用此配置项来覆盖默认的 Qwen API 请求基础 URL
+- 默认值：`https://dashscope.aliyuncs.com/compatible-mode/v1`
+- 示例：`https://my-qwen-proxy.com/v1`
+
 ## Stepfun AI

 ### `STEPFUN_API_KEY`
@@ -553,8 +575,31 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，
 ### `VOLCENGINE_MODEL_LIST`

 - 类型：可选
- 描述：用来控制模型列表，使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。模型定义语法规则见 [模型列表][model-list]
+- 描述：用来控制模型列表，使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名->部署名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。模型定义语法规则见 [模型列表][model-list]
 - 默认值：`-`
- 示例：`-all,+deepseek-r1-250120,+deepseek-v3-241226,+doubao-1-5-pro-256k-250115,+doubao-1-5-pro-32k-250115,+doubao-1-5-lite-32k-250115`
+- 示例：`-all,+deepseek-r1->deepseek-r1-250120,+deepseek-v3->deepseek-v3-250324,+doubao-1.5-pro-256k->doubao-1-5-pro-256k-250115,+doubao-1.5-pro-32k->doubao-1-5-pro-32k-250115,+doubao-1.5-lite-32k->doubao-1-5-lite-32k-250115`
+
+### `VOLCENGINE_PROXY_URL`
+
+- 类型：可选
+- 描述：如果你手动配置了 Volcengine 接口代理，可以使用此配置项来覆盖默认的 Volcengine API 请求基础 URL
+- 默认值：`https://ark.cn-beijing.volces.com/api/v3`
+- 示例：`https://my-volcengine-proxy.com/v1`
+
+## InfiniAI
+
+### `INFINIAI_API_KEY`
+
+- 类型：必选
+- 描述：这是你在 [Infini-AI](https://cloud.infini-ai.com) 申请的 API 密钥。
+- 默认值：-
+- 示例：`sk-xxxxxx...xxxxxx`
+
+### `INFINIAI_MODEL_LIST`
+
+- 类型：可选
+- 描述：用来控制模型列表，使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名->部署名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。模型定义语法规则见 [模型列表][model-list]
+- 默认值：`-`
+- 示例：`-all,+qwq-32b,+deepseek-r1`

 [model-list]: /zh/docs/self-hosting/advanced/model-list
@@ -140,7 +140,7 @@ tags:

  <Image alt={'Clerk 添加 Webhooks 端点'} src={'https://github.com/lobehub/lobe-chat/assets/28616219/f50f47fb-5e8e-4930-bf4e-8cf6f5b8afb9'} />

-  在 endppint 中填写你的 Vercel 项目的 URL，如 `https://your-project.vercel.app/api/webhooks/clerk`。然后在订阅事件（Subscribe to events）中，勾选 user 的三个事件（`user.created` 、`user.deleted`、`user.updated`），然后点击创建。
+  在 endpoint 中填写你的 Vercel 项目的 URL，如 `https://your-project.vercel.app/api/webhooks/clerk`。然后在订阅事件（Subscribe to events）中，勾选 user 的三个事件（`user.created` 、`user.deleted`、`user.updated`），然后点击创建。

  <Callout type={'warning'}>URL 的`https://`不可缺失，须保持 URL 的完整性</Callout>

@@ -0,0 +1,29 @@
+---
+title: Using Infini-AI in LobeChat
+description: Learn how to configure and utilize Infini-AI's model services in LobeChat.
+tags:
+  - LobeChat
+  - Infini-AI
+  - API Key
+  - LLM Deployment
+---
+
+# Using Infini-AI in LobeChat
+
+[Infini-AI](https://cloud.infini-ai.com/) is a large model service platform optimized for multiple chip architectures, providing efficient and unified AGI infrastructure solutions.
+
+This guide will help you quickly integrate Infini-AI's AI capabilities into LobeChat.
+
+<Steps>
+  ### Step 1: Obtain Infini-AI API Key
+
+  - Log in to the [Large Model Service Platform](https://cloud.infini-ai.com/genstudio/model)
+  - Select "API KEY Management" in the left navigation bar
+  - In the newly opened page, click the "Create API KEY" button, enter a name, and click "Create"
+
+  ### Step 2: Configure LobeChat Model Service
+
+  - Open LobeChat and go to the "Settings" interface
+  - Select "Infini-AI" in the "Language Model" module
+  - Paste the API key you obtained
+</Steps>
@@ -0,0 +1,33 @@
+---
+title: 在 LobeChat 中使用无问芯穹
+description: 学习如何在 LobeChat 中配置和使用无问芯穹的 API Key，实现 AI 对话交互。
+tags:
+  - LobeChat
+  - 无问芯穹
+  - API密钥
+  - 大模型部署
+---
+
+# 在 LobeChat 中使用无问芯穹
+
+[无问芯穹](https://cloud.infini-ai.com/)是基于多元芯片优化的大模型服务平台，提供高效统一的 AGI 基础设施解决方案。
+
+本文将指导你如何在 LobeChat 中快速接入无问芯穹的 AI 能力。
+
+<Callout type="info">
+  无问芯穹的图片链接输入有白名单机制，目前已知支持阿里云 OSS / AWS S3 等服务的图片链接。如果您在使用图片对话时遇到 400 报错，请尝试[使用 base64 编码上传图片](/docs/self-hosting/environment-variables/s3#llm-vision-image-use-base-64)。
+</Callout>
+
+<Steps>
+  ### 步骤一：获取无问芯穹 API Key
+
+  - 登录[大模型服务平台](https://cloud.infini-ai.com/genstudio/model)
+  - 在左侧导航栏选择「API KEY 管理」
+  - 在新打开的页面中，点击「创建 API KEY」按钮，填入名称，点击「创建」
+
+  ### 步骤二：配置 LobeChat 模型服务
+
+  - 打开 LobeChat 进入「设置」界面
+  - 在「语言模型」模块选择「Infini-AI」
+  - 粘贴已获取的 API 密钥
+</Steps>
@@ -52,4 +52,4 @@ tags:
  </Callout>
 </Steps>

-至此你已经可以在 LobeChat 中使用 PPIO 提供的模型进行对话了。
+至此你已经可以在 LobeChat 中使用 PPIO 派欧云提供的模型进行对话了。
@@ -64,6 +64,9 @@
    "stop": "توقف",
    "warp": "تغيير السطر"
  },
+  "intentUnderstanding": {
+    "title": "جارٍ فهم وتحليل نواياك..."
+  },
  "knowledgeBase": {
    "all": "جميع المحتويات",
    "allFiles": "جميع الملفات",
@@ -144,7 +147,6 @@
        "desc": "تحديد ما إذا كان من الضروري البحث بناءً على محتوى المحادثة",
        "title": "الاتصال الذكي"
      },
-      "disable": "النموذج الحالي لا يدعم استدعاء الوظائف، لذا لا يمكن استخدام وظيفة الاتصال الذكي",
      "off": {
        "desc": "استخدام المعرفة الأساسية للنموذج فقط، دون إجراء بحث عبر الإنترنت",
        "title": "إيقاف الاتصال"
@@ -155,6 +157,10 @@
      },
      "useModelBuiltin": "استخدام محرك البحث المدمج في النموذج"
    },
+    "searchModel": {
+      "desc": "النموذج الحالي لا يدعم استدعاء الدوال، لذا يجب استخدام نموذج يدعم استدعاء الدوال للبحث عبر الإنترنت",
+      "title": "نموذج البحث المساعد"
+    },
    "title": "بحث عبر الإنترنت"
  },
  "searchAgentPlaceholder": "مساعد البحث...",
@@ -41,7 +41,10 @@
    "error": {
      "desc": "نعتذر، حدث خطأ أثناء عملية تهيئة قاعدة بيانات Pglite. يرجى النقر على الزر لإعادة المحاولة. إذا استمرت المشكلة بعد عدة محاولات، يرجى <1>تقديم مشكلة</1>، وسنساعدك في حلها في أسرع وقت ممكن",
      "detail": "سبب الخطأ: [{{type}}] {{message}}، التفاصيل كالتالي:",
+      "detailTitle": "سبب الخطأ",
+      "report": "الإبلاغ عن مشكلة",
      "retry": "إعادة المحاولة",
+      "selfSolve": "حل ذاتي",
      "title": "فشل تهيئة قاعدة البيانات"
    },
    "initing": {
@@ -80,6 +83,54 @@
      "button": "استخدم الآن",
      "desc": "استخدم الآن",
      "title": "قاعدة بيانات PGlite جاهزة"
+    },
+    "solve": {
+      "backup": {
+        "backup": "نسخ احتياطي",
+        "backupSuccess": "تم النسخ الاحتياطي بنجاح",
+        "desc": "تصدير البيانات الأساسية من قاعدة البيانات الحالية",
+        "export": "تصدير جميع البيانات",
+        "exportDesc": "سيتم حفظ البيانات المصدرة بتنسيق JSON، ويمكن استخدامها لاستعادة أو تحليل لاحق.",
+        "reset": {
+          "alert": "تحذير",
+          "alertDesc": "قد تؤدي العمليات التالية إلى فقدان البيانات. يرجى التأكد من أنك قد قمت بعمل نسخة احتياطية من البيانات الهامة قبل المتابعة.",
+          "button": "إعادة تعيين قاعدة البيانات بالكامل (حذف جميع البيانات)",
+          "confirm": {
+            "desc": "ستؤدي هذه العملية إلى حذف جميع البيانات ولا يمكن التراجع عنها، هل تؤكد المتابعة؟",
+            "title": "تأكيد إعادة تعيين قاعدة البيانات"
+          },
+          "desc": "إعادة تعيين قاعدة البيانات في حالة عدم إمكانية الاستعادة",
+          "title": "إعادة تعيين قاعدة البيانات"
+        },
+        "restore": "استعادة",
+        "restoreSuccess": "تم الاستعادة بنجاح",
+        "title": "نسخ احتياطي للبيانات"
+      },
+      "diagnosis": {
+        "createdAt": "تاريخ الإنشاء",
+        "migratedAt": "تاريخ اكتمال النقل",
+        "sql": "نقل SQL",
+        "title": "حالة النقل"
+      },
+      "repair": {
+        "desc": "إدارة حالة النقل يدويًا",
+        "runSQL": "تنفيذ مخصص",
+        "sql": {
+          "clear": "مسح",
+          "desc": "تنفيذ عبارة SQL مخصصة لإصلاح مشاكل قاعدة البيانات",
+          "markFinished": "تحديد كمنتهية",
+          "placeholder": "أدخل عبارة SQL...",
+          "result": "نتيجة التنفيذ",
+          "run": "تنفيذ",
+          "title": "منفذ SQL"
+        },
+        "title": "تحكم النقل"
+      },
+      "tabs": {
+        "backup": "نسخ احتياطي واستعادة",
+        "diagnosis": "تشخيص",
+        "repair": "إصلاح"
+      }
    }
  },
  "close": "إغلاق",
@@ -132,7 +183,7 @@
  },
  "fullscreen": "وضع كامل الشاشة",
  "historyRange": "نطاق التاريخ",
-  "import": "استيراد الإعدادات",
+  "importData": "استيراد البيانات",
  "importModal": {
    "error": {
      "desc": "عذرًا، حدث استثناء أثناء عملية استيراد البيانات. يرجى المحاولة مرة أخرى، أو <1>تقديم مشكلتك</1>، وسنقوم بمساعدتك على الفور في تحديد المشكلة.",
@@ -154,7 +205,8 @@
      "sessions": "الجلسات",
      "skips": "التخطيات",
      "topics": "المواضيع",
-      "type": "نوع البيانات"
+      "type": "نوع البيانات",
+      "update": "تحديث السجل"
    },
    "title": "استيراد البيانات",
    "uploading": {
@@ -163,6 +215,16 @@
      "speed": "سرعة الرفع"
    }
  },
+  "importPreview": {
+    "confirmImport": "تأكيد الاستيراد",
+    "tables": {
+      "count": "عدد السجلات",
+      "name": "اسم الجدول"
+    },
+    "title": "معاينة بيانات الاستيراد",
+    "totalRecords": "إجمالي السجلات التي سيتم استيرادها {{count}}",
+    "totalTables": "{{count}} جدول"
+  },
  "information": "المجتمع والمعلومات",
  "installPWA": "تثبيت تطبيق المتصفح",
  "lang": {
@@ -76,6 +76,7 @@
      "custom": "نموذج مخصص، الإعداد الافتراضي يدعم الاستدعاء الوظيفي والتعرف البصري، يرجى التحقق من قدرة النموذج على القيام بذلك بناءً على الحالة الفعلية",
      "file": "يدعم هذا النموذج قراءة وتعرف الملفات المرفوعة",
      "functionCall": "يدعم هذا النموذج استدعاء الوظائف",
+      "imageOutput": "يدعم هذا النموذج إنشاء الصور",
      "reasoning": "يدعم هذا النموذج التفكير العميق",
      "search": "يدعم هذا النموذج البحث عبر الإنترنت",
      "tokens": "يدعم هذا النموذج حتى {{tokens}} رمزًا في جلسة واحدة",
@@ -85,6 +86,8 @@
  },
  "ModelSwitchPanel": {
    "emptyModel": "لا توجد نماذج ممكن تمكينها، يرجى الانتقال إلى الإعدادات لتمكينها",
+    "emptyProvider": "لا توجد مزودات مفعلة، يرجى الذهاب إلى الإعدادات لتفعيلها",
+    "goToSettings": "اذهب إلى الإعدادات",
    "provider": "مزود"
  },
  "OllamaSetupGuide": {
@@ -16,6 +16,16 @@
    "detail": "تفاصيل الخطأ",
    "title": "فشل الطلب"
  },
+  "import": {
+    "importConfigFile": {
+      "description": "سبب الخطأ: {{reason}}",
+      "title": "فشل الاستيراد"
+    },
+    "incompatible": {
+      "description": "تم تصدير هذا الملف من إصدار أعلى، يرجى محاولة الترقية إلى أحدث إصدار ثم إعادة الاستيراد",
+      "title": "التطبيق الحالي لا يدعم استيراد هذا الملف"
+    }
+  },
  "loginRequired": {
    "desc": "سيتم التحويل تلقائيًا إلى صفحة تسجيل الدخول",
    "title": "يرجى تسجيل الدخول لاستخدام هذه الميزة"
@@ -69,6 +79,7 @@
    "524": "عذرًا، انتهت مهلة الخادم أثناء الانتظار للرد، قد يكون ذلك بسبب بطء الاستجابة، يرجى المحاولة مرة أخرى لاحقًا",
    "AgentRuntimeError": "حدث خطأ في تشغيل نموذج Lobe اللغوي، يرجى التحقق من المعلومات التالية أو إعادة المحاولة",
    "ConnectionCheckFailed": "الاستجابة فارغة، يرجى التحقق من أن عنوان وكيل الـ API لا ينتهي بـ `/v1`",
+    "CreateMessageError": "عذرًا، لم يتم إرسال الرسالة بشكل صحيح، يرجى نسخ المحتوى وإعادة إرساله، بعد تحديث الصفحة لن يتم الاحتفاظ بهذه الرسالة",
    "ExceededContextWindow": "المحتوى المطلوب الحالي يتجاوز الطول الذي يمكن للنموذج معالجته، يرجى تقليل كمية المحتوى ثم إعادة المحاولة",
    "FreePlanLimit": "أنت حاليًا مستخدم مجاني، لا يمكنك استخدام هذه الوظيفة، يرجى الترقية إلى خطة مدفوعة للمتابعة",
    "InsufficientQuota": "عذرًا، لقد reached الحد الأقصى للحصة (quota) لهذه المفتاح، يرجى التحقق من رصيد الحساب الخاص بك أو زيادة حصة المفتاح ثم المحاولة مرة أخرى",
@@ -0,0 +1,46 @@
+{
+  "addUserMessage": {
+    "desc": "إضافة المحتوى الحالي كرسالة مستخدم دون تفعيل التوليد",
+    "title": "إضافة رسالة مستخدم"
+  },
+  "editMessage": {
+    "desc": "الدخول إلى وضع التحرير عن طريق الضغط على مفتاح Alt والنقر المزدوج على الرسالة",
+    "title": "تحرير الرسالة"
+  },
+  "openChatSettings": {
+    "desc": "عرض وتعديل إعدادات المحادثة الحالية",
+    "title": "فتح إعدادات المحادثة"
+  },
+  "openHotkeyHelper": {
+    "desc": "عرض جميع تعليمات استخدام الاختصارات",
+    "title": "فتح مساعدة الاختصارات"
+  },
+  "regenerateMessage": {
+    "desc": "إعادة توليد آخر رسالة",
+    "title": "إعادة توليد الرسالة"
+  },
+  "saveTopic": {
+    "desc": "حفظ الموضوع الحالي وفتح موضوع جديد",
+    "title": "فتح موضوع جديد"
+  },
+  "search": {
+    "desc": "استدعاء مربع البحث الرئيسي في الصفحة الحالية",
+    "title": "بحث"
+  },
+  "switchAgent": {
+    "desc": "تبديل المساعد المثبت في الشريط الجانبي عن طريق الضغط على Ctrl مع الأرقام من 0 إلى 9",
+    "title": "تبديل المساعد بسرعة"
+  },
+  "toggleLeftPanel": {
+    "desc": "عرض أو إخفاء لوحة المساعد على اليسار",
+    "title": "عرض/إخفاء لوحة المساعد"
+  },
+  "toggleRightPanel": {
+    "desc": "عرض أو إخفاء لوحة المواضيع على اليمين",
+    "title": "عرض/إخفاء لوحة الموضوع"
+  },
+  "toggleZenMode": {
+    "desc": "في وضع التركيز، عرض المحادثة الحالية فقط، وإخفاء واجهة المستخدم الأخرى",
+    "title": "تبديل وضع التركيز"
+  }
+}
@@ -1,13 +1,4 @@
 {
-  "01-ai/Yi-1.5-34B-Chat-16K": {
-    "description": "Yi-1.5 34B، يقدم أداءً ممتازًا في التطبيقات الصناعية بفضل مجموعة التدريب الغنية."
-  },
-  "01-ai/Yi-1.5-6B-Chat": {
-    "description": "Yi-1.5-6B-Chat هو متغير من سلسلة Yi-1.5، وهو نموذج دردشة مفتوح المصدر. Yi-1.5 هو إصدار مطور من Yi، تم تدريبه على 500B من البيانات عالية الجودة، وتم تحسينه على 3M من عينات التعديل المتنوعة. مقارنةً بـ Yi، يظهر Yi-1.5 أداءً أقوى في الترميز، والرياضيات، والاستدلال، والامتثال للتعليمات، مع الحفاظ على قدرة ممتازة في فهم اللغة، والاستدلال العام، وفهم القراءة. يتوفر هذا النموذج بإصدارات بطول سياق 4K و16K و32K، مع إجمالي تدريب يصل إلى 3.6T توكن."
-  },
-  "01-ai/Yi-1.5-9B-Chat-16K": {
-    "description": "Yi-1.5 9B يدعم 16K توكن، ويوفر قدرة توليد لغوية فعالة وسلسة."
-  },
  "01-ai/yi-1.5-34b-chat": {
    "description": "Zero One Everything، أحدث نموذج مفتوح المصدر تم تعديله، يحتوي على 34 مليار معلمة، ويدعم تعديلات متعددة لمشاهد الحوار، مع بيانات تدريب عالية الجودة تتماشى مع تفضيلات البشر."
  },
@@ -149,12 +140,6 @@
  "Llama-3.2-90B-Vision-Instruct\t": {
    "description": "قدرات استدلال الصور المتقدمة المناسبة لتطبيقات الوكلاء في الفهم البصري."
  },
-  "LoRA/Qwen/Qwen2.5-72B-Instruct": {
-    "description": "Qwen2.5-72B-Instruct هو أحد أحدث نماذج اللغة الكبيرة التي أصدرتها Alibaba Cloud. يتمتع هذا النموذج بقدرات محسنة بشكل ملحوظ في مجالات الترميز والرياضيات. كما يوفر دعمًا للغات متعددة، تغطي أكثر من 29 لغة، بما في ذلك الصينية والإنجليزية. أظهر النموذج تحسينات ملحوظة في اتباع التعليمات، وفهم البيانات الهيكلية، وتوليد المخرجات الهيكلية (خاصة JSON)."
-  },
-  "LoRA/Qwen/Qwen2.5-7B-Instruct": {
-    "description": "Qwen2.5-7B-Instruct هو أحد أحدث نماذج اللغة الكبيرة التي أصدرتها Alibaba Cloud. يتمتع هذا النموذج بقدرات محسنة بشكل ملحوظ في مجالات الترميز والرياضيات. كما يوفر دعمًا للغات متعددة، تغطي أكثر من 29 لغة، بما في ذلك الصينية والإنجليزية. أظهر النموذج تحسينات ملحوظة في اتباع التعليمات، وفهم البيانات الهيكلية، وتوليد المخرجات الهيكلية (خاصة JSON)."
-  },
  "Meta-Llama-3.1-405B-Instruct": {
    "description": "نموذج نصي تم تعديله تحت الإشراف من Llama 3.1، تم تحسينه لحالات الحوار متعددة اللغات، حيث يتفوق في العديد من نماذج الدردشة مفتوحة ومغلقة المصدر المتاحة في المعايير الصناعية الشائعة."
  },
@@ -179,9 +164,6 @@
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": {
    "description": "Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) هو نموذج تعليمات عالي الدقة، مناسب للحسابات المعقدة."
  },
-  "OpenGVLab/InternVL2-26B": {
-    "description": "أظهر InternVL2 أداءً رائعًا في مجموعة متنوعة من مهام اللغة البصرية، بما في ذلك فهم الوثائق والرسوم البيانية، وفهم النصوص في المشاهد، وOCR، وحل المشكلات العلمية والرياضية."
-  },
  "Phi-3-medium-128k-instruct": {
    "description": "نموذج Phi-3-medium نفسه، ولكن مع حجم سياق أكبر لـ RAG أو التوجيه القليل."
  },
@@ -206,9 +188,6 @@
  "Phi-3.5-vision-instrust": {
    "description": "النسخة المحدثة من نموذج Phi-3-vision."
  },
-  "Pro/OpenGVLab/InternVL2-8B": {
-    "description": "أظهر InternVL2 أداءً رائعًا في مجموعة متنوعة من مهام اللغة البصرية، بما في ذلك فهم الوثائق والرسوم البيانية، وفهم النصوص في المشاهد، وOCR، وحل المشكلات العلمية والرياضية."
-  },
  "Pro/Qwen/Qwen2-1.5B-Instruct": {
    "description": "Qwen2-1.5B-Instruct هو نموذج لغوي كبير تم تعديله وفقًا للتعليمات في سلسلة Qwen2، بحجم 1.5B. يعتمد هذا النموذج على بنية Transformer، ويستخدم تقنيات مثل دالة تنشيط SwiGLU، وتحويل QKV، والانتباه الجماعي. أظهر أداءً ممتازًا في فهم اللغة، والتوليد، والقدرات متعددة اللغات، والترميز، والرياضيات، والاستدلال في العديد من اختبارات المعايير، متجاوزًا معظم النماذج مفتوحة المصدر."
  },
@@ -224,20 +203,26 @@
  "Pro/Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct هو أحدث إصدار من سلسلة نماذج اللغة الكبيرة المحددة للشيفرة التي أصدرتها Alibaba Cloud. تم تحسين هذا النموذج بشكل كبير في توليد الشيفرة، والاستدلال، وإصلاح الأخطاء، من خلال تدريب على 55 تريليون توكن."
  },
+  "Pro/Qwen/Qwen2.5-VL-7B-Instruct": {
+    "description": "Qwen2.5-VL هو العضو الجديد في سلسلة Qwen، يتمتع بقدرات فهم بصري قوية، يمكنه تحليل النصوص والرسوم البيانية والتخطيطات في الصور، وفهم مقاطع الفيديو الطويلة واستيعاب الأحداث. بإمكانه القيام بالاستدلال والتعامل مع الأدوات، يدعم تحديد الكائنات متعددة التنسيقات وإنشاء مخرجات منظمة، كما تم تحسين ديناميكية الدقة ومعدل الإطارات في التدريب لفهم الفيديو، مع تعزيز كفاءة مشفر الرؤية."
+  },
  "Pro/THUDM/glm-4-9b-chat": {
    "description": "GLM-4-9B-Chat هو الإصدار مفتوح المصدر من نموذج GLM-4 الذي أطلقته Zhizhu AI. أظهر هذا النموذج أداءً ممتازًا في مجالات الدلالات، والرياضيات، والاستدلال، والشيفرة، والمعرفة. بالإضافة إلى دعم المحادثات متعددة الجولات، يتمتع GLM-4-9B-Chat أيضًا بميزات متقدمة مثل تصفح الويب، وتنفيذ الشيفرة، واستدعاء الأدوات المخصصة (Function Call)، والاستدلال على النصوص الطويلة. يدعم النموذج 26 لغة، بما في ذلك الصينية، والإنجليزية، واليابانية، والكورية، والألمانية. أظهر GLM-4-9B-Chat أداءً ممتازًا في العديد من اختبارات المعايير مثل AlignBench-v2 وMT-Bench وMMLU وC-Eval. يدعم النموذج طول سياق يصل إلى 128K، مما يجعله مناسبًا للأبحاث الأكاديمية والتطبيقات التجارية."
  },
  "Pro/deepseek-ai/DeepSeek-R1": {
    "description": "DeepSeek-R1 هو نموذج استدلال مدفوع بالتعلم المعزز (RL)، يعالج مشكلات التكرار وقابلية القراءة في النموذج. قبل التعلم المعزز، أدخل DeepSeek-R1 بيانات بدء التشغيل الباردة، مما أدى إلى تحسين أداء الاستدلال. إنه يتفوق في المهام الرياضية، والبرمجة، والاستدلال مقارنةً بـ OpenAI-o1، وقد حسّن الأداء العام من خلال طرق تدريب مصممة بعناية."
  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+    "description": "DeepSeek-R1-Distill-Qwen-1.5B هو نموذج تم الحصول عليه من خلال تقطير المعرفة بناءً على Qwen2.5-Math-1.5B. تم ضبط هذا النموذج باستخدام 800 ألف عينة مختارة تم إنشاؤها بواسطة DeepSeek-R1، حيث أظهر أداءً جيدًا في معايير متعددة. كنموذج خفيف الوزن، حقق دقة 83.9٪ في MATH-500، ومعدل نجاح 28.9٪ في AIME 2024، وحصل على تقييم 954 في CodeForces، مما يظهر قدرة استدلالية تتجاوز حجم معلماته."
+  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+    "description": "DeepSeek-R1-Distill-Qwen-7B هو نموذج تم الحصول عليه من خلال تقطير المعرفة بناءً على Qwen2.5-Math-7B. تم ضبط هذا النموذج باستخدام 800 ألف عينة مختارة تم إنشاؤها بواسطة DeepSeek-R1، مما يظهر قدرات استدلالية ممتازة. أظهر أداءً متميزًا في العديد من الاختبارات المعيارية، حيث حقق دقة 92.8٪ في MATH-500، ومعدل نجاح 55.5٪ في AIME 2024، ودرجة 1189 في CodeForces، مما يظهر قدرات قوية في الرياضيات والبرمجة كنموذج بحجم 7B."
+  },
  "Pro/deepseek-ai/DeepSeek-V3": {
    "description": "DeepSeek-V3 هو نموذج لغوي مختلط الخبراء (MoE) يحتوي على 6710 مليار معلمة، يستخدم الانتباه المتعدد الرؤوس (MLA) وهيكل DeepSeekMoE، ويجمع بين استراتيجيات توازن الحمل بدون خسائر مساعدة، مما يحسن كفاءة الاستدلال والتدريب. تم تدريبه مسبقًا على 14.8 تريليون توكن عالية الجودة، وتم إجراء تعديل دقيق تحت الإشراف والتعلم المعزز، مما يجعل DeepSeek-V3 يتفوق على نماذج مفتوحة المصدر الأخرى، ويقترب من النماذج المغلقة الرائدة."
  },
-  "Pro/google/gemma-2-9b-it": {
-    "description": "Gemma هو أحد نماذج Google المتقدمة والخفيفة الوزن من سلسلة النماذج المفتوحة. إنه نموذج لغوي كبير يعتمد على فك الشيفرة فقط، يدعم اللغة الإنجليزية، ويقدم أوزان مفتوحة، ومتغيرات مدربة مسبقًا، ومتغيرات معدلة وفقًا للتعليمات. نموذج Gemma مناسب لمجموعة متنوعة من مهام توليد النصوص، بما في ذلك الأسئلة والأجوبة، والتلخيص، والاستدلال. تم تدريب هذا النموذج 9B على 8 تريليون توكن. حجمه النسبي الصغير يجعله مناسبًا للنشر في بيئات ذات موارد محدودة، مثل أجهزة الكمبيوتر المحمولة، وأجهزة الكمبيوتر المكتبية، أو البنية التحتية السحابية الخاصة بك، مما يتيح لمزيد من الأشخاص الوصول إلى نماذج الذكاء الاصطناعي المتقدمة وتعزيز الابتكار."
-  },
-  "Pro/meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "Meta Llama 3.1 هو جزء من عائلة نماذج اللغة الكبيرة متعددة اللغات التي طورتها Meta، بما في ذلك متغيرات مدربة مسبقًا ومعدلة وفقًا للتعليمات بحجم 8B و70B و405B. تم تحسين هذا النموذج 8B وفقًا لمشاهدات المحادثات متعددة اللغات، وأظهر أداءً ممتازًا في العديد من اختبارات المعايير الصناعية. تم تدريب النموذج باستخدام أكثر من 15 تريليون توكن من البيانات العامة، واستخدم تقنيات مثل التعديل الخاضع للإشراف والتعلم المعزز من ردود الفعل البشرية لتحسين فائدة النموذج وأمانه. يدعم Llama 3.1 توليد النصوص وتوليد الشيفرة، مع تاريخ معرفة حتى ديسمبر 2023."
+  "Pro/deepseek-ai/DeepSeek-V3-1226": {
+    "description": "DeepSeek-V3 هو نموذج لغوي مختلط الخبراء (MoE) يحتوي على 6710 مليار معلمة، ويستخدم الانتباه المتعدد الرؤوس (MLA) وبنية DeepSeekMoE، مع دمج استراتيجية توازن الحمل بدون خسارة مساعدة، لتحسين كفاءة الاستدلال والتدريب. تم تدريبه مسبقًا على 14.8 تريليون توكن عالي الجودة، وتمت معالجته من خلال التعديل الإشرافي والتعلم المعزز، يتفوق DeepSeek-V3 في الأداء على النماذج مفتوحة المصدر الأخرى، ويقترب من النماذج المغلقة الرائدة."
  },
  "QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview هو نموذج معالجة اللغة الطبيعية المبتكر، قادر على معالجة مهام توليد الحوار وفهم السياق بشكل فعال."
@@ -290,6 +275,12 @@
  "Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct هو أحدث إصدار من سلسلة نماذج اللغة الكبيرة المحددة للشيفرة التي أصدرتها Alibaba Cloud. تم تحسين هذا النموذج بشكل كبير في توليد الشيفرة، والاستدلال، وإصلاح الأخطاء، من خلال تدريب على 55 تريليون توكن."
  },
+  "Qwen/Qwen2.5-VL-32B-Instruct": {
+    "description": "Qwen2.5-VL-32B-Instruct هو نموذج متعدد الوسائط تم تطويره بواسطة فريق Tongyi Qianwen، وهو جزء من سلسلة Qwen2.5-VL. لا يتقن هذا النموذج فقط التعرف على الأشياء الشائعة، بل يمكنه أيضًا تحليل النصوص والرسوم البيانية والرموز والأشكال والتخطيطات في الصور. يعمل كعامل ذكي بصري قادر على التفكير والتعامل الديناميكي مع الأدوات، مع امتلاك القدرة على استخدام الحاسوب والهاتف المحمول. بالإضافة إلى ذلك، يمكن لهذا النموذج تحديد مواقع الكائنات في الصور بدقة وإنتاج مخرجات منظمة للفواتير والجداول وغيرها. مقارنةً بالنموذج السابق Qwen2-VL، فقد تم تحسين هذه النسخة بشكل أكبر في القدرات الرياضية وحل المشكلات من خلال التعلم المعزز، كما أن أسلوب الاستجابة أصبح أكثر توافقًا مع تفضيلات البشر."
+  },
+  "Qwen/Qwen2.5-VL-72B-Instruct": {
+    "description": "Qwen2.5-VL هو نموذج اللغة البصرية في سلسلة Qwen2.5. يتميز هذا النموذج بتحسينات كبيرة في جوانب متعددة: قدرة أقوى على الفهم البصري، مع القدرة على التعرف على الأشياء الشائعة وتحليل النصوص والرسوم البيانية والتخطيطات؛ كوسيط بصري يمكنه التفكير وتوجيه استخدام الأدوات ديناميكيًا؛ يدعم فهم مقاطع الفيديو الطويلة التي تزيد عن ساعة واحدة مع القدرة على التقاط الأحداث الرئيسية؛ يمكنه تحديد موقع الأشياء في الصور بدقة من خلال إنشاء مربعات حدودية أو نقاط؛ يدعم إنشاء مخرجات منظمة، وهو مفيد بشكل خاص للبيانات الممسوحة ضوئيًا مثل الفواتير والجداول."
+  },
  "Qwen2-72B-Instruct": {
    "description": "Qwen2 هو أحدث سلسلة من نموذج Qwen، ويدعم سياقًا يصل إلى 128 ألف، مقارنةً بأفضل النماذج مفتوحة المصدر الحالية، يتفوق Qwen2-72B بشكل ملحوظ في فهم اللغة الطبيعية والمعرفة والترميز والرياضيات والقدرات متعددة اللغات."
  },
@@ -374,9 +365,6 @@
  "TeleAI/TeleChat2": {
    "description": "نموذج TeleChat2 هو نموذج كبير تم تطويره ذاتيًا من قبل China Telecom، يدعم وظائف مثل الأسئلة والأجوبة الموسوعية، وتوليد الشيفرة، وتوليد النصوص الطويلة، ويقدم خدمات استشارية للمستخدمين، مما يمكنه من التفاعل مع المستخدمين، والإجابة على الأسئلة، والمساعدة في الإبداع، وتوفير المعلومات والمعرفة والإلهام بكفاءة وسهولة. أظهر النموذج أداءً ممتازًا في معالجة مشكلات الهلوسة، وتوليد النصوص الطويلة، وفهم المنطق."
  },
-  "TeleAI/TeleMM": {
-    "description": "نموذج TeleMM هو نموذج كبير لفهم متعدد الوسائط تم تطويره ذاتيًا من قبل China Telecom، يمكنه معالجة مدخلات متعددة الوسائط مثل النصوص والصور، ويدعم وظائف مثل فهم الصور، وتحليل الرسوم البيانية، مما يوفر خدمات فهم متعددة الوسائط للمستخدمين. يمكن للنموذج التفاعل مع المستخدمين بطرق متعددة الوسائط، وفهم المحتوى المدخل بدقة، والإجابة على الأسئلة، والمساعدة في الإبداع، وتوفير معلومات متعددة الوسائط ودعم الإلهام بكفاءة. أظهر أداءً ممتازًا في المهام متعددة الوسائط مثل الإدراك الدقيق، والاستدلال المنطقي."
-  },
  "Vendor-A/Qwen/Qwen2.5-72B-Instruct": {
    "description": "Qwen2.5-72B-Instruct هو أحد أحدث نماذج اللغة الكبيرة التي أصدرتها Alibaba Cloud. يتمتع هذا النموذج بقدرات محسنة بشكل ملحوظ في مجالات الترميز والرياضيات. كما يوفر دعمًا للغات متعددة، تغطي أكثر من 29 لغة، بما في ذلك الصينية والإنجليزية. أظهر النموذج تحسينات ملحوظة في اتباع التعليمات، وفهم البيانات الهيكلية، وتوليد المخرجات الهيكلية (خاصة JSON)."
  },
@@ -506,6 +494,9 @@
  "anthropic/claude-3.5-sonnet": {
    "description": "Claude 3.5 Sonnet يقدم قدرات تتجاوز Opus وسرعة أكبر من Sonnet، مع الحفاظ على نفس السعر. يتميز Sonnet بمهارات خاصة في البرمجة وعلوم البيانات ومعالجة الصور والمهام الوكيلة."
  },
+  "anthropic/claude-3.7-sonnet": {
+    "description": "Claude 3.7 Sonnet هو أكثر النماذج ذكاءً من Anthropic حتى الآن، وهو أيضًا أول نموذج مختلط للتفكير في السوق. يمكن لـ Claude 3.7 Sonnet إنتاج استجابات شبه فورية أو تفكير تدريجي ممتد، حيث يمكن للمستخدمين رؤية هذه العمليات بوضوح. يتميز Sonnet بشكل خاص في البرمجة، وعلوم البيانات، ومعالجة الصور، والمهام الوكيلة."
+  },
  "aya": {
    "description": "Aya 23 هو نموذج متعدد اللغات أطلقته Cohere، يدعم 23 لغة، مما يسهل التطبيقات اللغوية المتنوعة."
  },
@@ -515,9 +506,27 @@
  "baichuan/baichuan2-13b-chat": {
    "description": "Baichuan-13B هو نموذج لغوي كبير مفتوح المصدر قابل للاستخدام التجاري تم تطويره بواسطة Baichuan Intelligence، ويحتوي على 13 مليار معلمة، وقد حقق أفضل النتائج في المعايير الصينية والإنجليزية."
  },
+  "c4ai-aya-expanse-32b": {
+    "description": "Aya Expanse هو نموذج متعدد اللغات عالي الأداء بسعة 32B، يهدف إلى تحدي أداء النماذج أحادية اللغة من خلال تحسين التعليمات، وتداول البيانات، وتدريب التفضيلات، وابتكارات دمج النماذج. يدعم 23 لغة."
+  },
+  "c4ai-aya-expanse-8b": {
+    "description": "Aya Expanse هو نموذج متعدد اللغات عالي الأداء بسعة 8B، يهدف إلى تحدي أداء النماذج أحادية اللغة من خلال تحسين التعليمات، وتداول البيانات، وتدريب التفضيلات، وابتكارات دمج النماذج. يدعم 23 لغة."
+  },
+  "c4ai-aya-vision-32b": {
+    "description": "Aya Vision هو نموذج متعدد الوسائط متقدم، يظهر أداءً ممتازًا في عدة معايير رئيسية للغة والنص والصورة. يدعم 23 لغة. يركز هذا الإصدار الذي يحتوي على 32 مليار معلمة على الأداء المتقدم متعدد اللغات."
+  },
+  "c4ai-aya-vision-8b": {
+    "description": "Aya Vision هو نموذج متعدد الوسائط متقدم، يظهر أداءً ممتازًا في عدة معايير رئيسية للغة والنص والصورة. يركز هذا الإصدار الذي يحتوي على 8 مليار معلمة على تقليل زمن الاستجابة وتحقيق أفضل أداء."
+  },
  "charglm-3": {
    "description": "CharGLM-3 مصمم خصيصًا للأدوار التفاعلية والمرافقة العاطفية، يدعم ذاكرة متعددة الجولات طويلة الأمد وحوارات مخصصة، ويستخدم على نطاق واسع."
  },
+  "chatglm3": {
+    "description": "ChatGLM3 هو نموذج مغلق المصدر تم إصداره بواسطة مختبر KEG في جامعة تسينغهوا وشركة Zhizhu AI، وقد تم تدريبه مسبقًا على كميات هائلة من المعرفة المعرفية باللغتين الصينية والإنجليزية، وتم تحسينه وفقًا للاختيارات البشرية. مقارنة بالنموذج الأول، حقق تحسينات بنسبة 16٪ و 36٪ و 280٪ في MMLU و C-Eval و GSM8K على التوالي، وتصدر قائمة المهام الصينية C-Eval. يناسب هذا النموذج السيناريوهات التي تتطلب كميات كبيرة من المعرفة وقدرات الاستدلال والإبداع، مثل كتابة النصوص الإعلانية وكتابة الروايات وكتابة المحتوى المعرفي وتكوين الكود."
+  },
+  "chatglm3-6b-base": {
+    "description": "ChatGLM3-6b-base هو النموذج الأساسي المفتوح المصدر الأحدث من سلسلة ChatGLM التي طورتها شركة Zhìpǔ، ويحتوي على 6 مليارات معلمة."
+  },
  "chatgpt-4o-latest": {
    "description": "ChatGPT-4o هو نموذج ديناميكي يتم تحديثه في الوقت الحقيقي للحفاظ على أحدث إصدار. يجمع بين فهم اللغة القوي وقدرات التوليد، مما يجعله مناسبًا لمجموعة واسعة من التطبيقات، بما في ذلك خدمة العملاء والتعليم والدعم الفني."
  },
@@ -593,12 +602,39 @@
  "cohere-command-r-plus": {
    "description": "نموذج RAG محسّن من الطراز الأول مصمم للتعامل مع أحمال العمل على مستوى المؤسسات."
  },
+  "command": {
+    "description": "نموذج حواري يتبع التعليمات، يظهر جودة عالية وموثوقية أكبر في المهام اللغوية، ويتميز بطول سياق أطول مقارنة بنموذجنا الأساسي للتوليد."
+  },
+  "command-a-03-2025": {
+    "description": "الأمر A هو أقوى نموذج لدينا حتى الآن، حيث يظهر أداءً ممتازًا في استخدام الأدوات، والوكالات، والتوليد المعزز بالاسترجاع (RAG)، وسيناريوهات التطبيقات متعددة اللغات. يتمتع الأمر A بطول سياق يبلغ 256K، ويمكن تشغيله باستخدام وحدتي GPU فقط، وقد زادت الإنتاجية بنسبة 150% مقارنةً بالأمر R+ 08-2024."
+  },
+  "command-light": {
+    "description": "إصدار أصغر وأسرع من الأمر، قوي تقريبًا بنفس القدر ولكنه أسرع."
+  },
+  "command-light-nightly": {
+    "description": "لتقليل الفجوة الزمنية بين إصدارات النسخ الرئيسية، أطلقنا إصدارًا ليليًا من نموذج الأمر. بالنسبة لسلسلة command-light، يُطلق على هذا الإصدار اسم command-light-nightly. يرجى ملاحظة أن command-light-nightly هو الإصدار الأحدث والأكثر تجريبية (وربما غير مستقر). يتم تحديث الإصدارات الليلية بانتظام دون إشعار مسبق، لذا لا يُنصح باستخدامها في بيئات الإنتاج."
+  },
+  "command-nightly": {
+    "description": "لتقليل الفجوة الزمنية بين إصدارات النسخ الرئيسية، أطلقنا إصدارًا ليليًا من نموذج الأمر. بالنسبة لسلسلة الأمر، يُطلق على هذا الإصدار اسم command-cightly. يرجى ملاحظة أن command-nightly هو الإصدار الأحدث والأكثر تجريبية (وربما غير مستقر). يتم تحديث الإصدارات الليلية بانتظام دون إشعار مسبق، لذا لا يُنصح باستخدامها في بيئات الإنتاج."
+  },
  "command-r": {
    "description": "Command R هو نموذج LLM محسن لمهام الحوار والسياقات الطويلة، مناسب بشكل خاص للتفاعل الديناميكي وإدارة المعرفة."
  },
+  "command-r-03-2024": {
+    "description": "الأمر R هو نموذج حواري يتبع التعليمات، ويظهر جودة أعلى وموثوقية أكبر في المهام اللغوية، ويتميز بطول سياق أطول مقارنة بالنماذج السابقة. يمكن استخدامه في عمليات العمل المعقدة مثل توليد الشيفرات، والتوليد المعزز بالاسترجاع (RAG)، واستخدام الأدوات، والوكالات."
+  },
+  "command-r-08-2024": {
+    "description": "الأمر-r-08-2024 هو إصدار محدث من نموذج الأمر R، تم إصداره في أغسطس 2024."
+  },
  "command-r-plus": {
    "description": "Command R+ هو نموذج لغوي كبير عالي الأداء، مصمم لمشاهد الأعمال الحقيقية والتطبيقات المعقدة."
  },
+  "command-r-plus-04-2024": {
+    "description": "الأمر R+ هو نموذج حواري يتبع التعليمات، ويظهر جودة أعلى وموثوقية أكبر في المهام اللغوية، ويتميز بطول سياق أطول مقارنة بالنماذج السابقة. إنه الأنسب لعمليات العمل المعقدة في RAG واستخدام الأدوات متعددة الخطوات."
+  },
+  "command-r7b-12-2024": {
+    "description": "الأمر-r7b-12-2024 هو إصدار صغير وفعال تم إصداره في ديسمبر 2024. يظهر أداءً ممتازًا في المهام التي تتطلب استدلالًا معقدًا ومعالجة متعددة الخطوات مثل RAG، واستخدام الأدوات، والوكالات."
+  },
  "dall-e-2": {
    "description": "النموذج الثاني من DALL·E، يدعم توليد صور أكثر واقعية ودقة، بدقة تعادل أربعة أضعاف الجيل الأول."
  },
@@ -614,9 +650,6 @@
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": {
    "description": "نموذج التقطير DeepSeek-R1، تم تحسين أداء الاستدلال من خلال التعلم المعزز وبيانات البداية الباردة، ويعيد نموذج المصدر فتح معايير المهام المتعددة."
  },
-  "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
-    "description": "DeepSeek-R1-Distill-Llama-8B هو نموذج تم تطويره بناءً على Llama-3.1-8B. تم ضبط هذا النموذج باستخدام عينات تم إنشاؤها بواسطة DeepSeek-R1، ويظهر قدرة استدلال ممتازة. حقق أداءً جيدًا في اختبارات المعايير، حيث حقق دقة 89.1% في MATH-500، وحقق معدل نجاح 50.4% في AIME 2024، وحصل على تقييم 1205 في CodeForces، مما يظهر قدرة قوية في الرياضيات والبرمجة كنموذج بحجم 8B."
-  },
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
    "description": "نموذج التقطير DeepSeek-R1، تم تحسين أداء الاستدلال من خلال التعلم المعزز وبيانات البداية الباردة، ويعيد نموذج المصدر فتح معايير المهام المتعددة."
  },
@@ -659,12 +692,30 @@
  "deepseek-r1": {
    "description": "DeepSeek-R1 هو نموذج استدلال مدفوع بالتعلم المعزز (RL) يعالج مشكلات التكرار وقابلية القراءة في النموذج. قبل استخدام RL، قدم DeepSeek-R1 بيانات بدء باردة، مما أدى إلى تحسين أداء الاستدلال. إنه يقدم أداءً مماثلاً لـ OpenAI-o1 في المهام الرياضية والبرمجية والاستدلال، وقد حسّن النتائج العامة من خلال طرق تدريب مصممة بعناية."
  },
+  "deepseek-r1-70b-fast-online": {
+    "description": "DeepSeek R1 70B النسخة السريعة، تدعم البحث المتصل في الوقت الحقيقي، وتوفر سرعة استجابة أسرع مع الحفاظ على أداء النموذج."
+  },
+  "deepseek-r1-70b-online": {
+    "description": "DeepSeek R1 70B النسخة القياسية، تدعم البحث المتصل في الوقت الحقيقي، مناسبة للمحادثات والمهام النصية التي تتطلب معلومات حديثة."
+  },
+  "deepseek-r1-distill-llama": {
+    "description": "deepseek-r1-distill-llama هو نموذج مستخلص من DeepSeek-R1 بناءً على Llama."
+  },
  "deepseek-r1-distill-llama-70b": {
    "description": "DeepSeek R1 - النموذج الأكبر والأذكى في مجموعة DeepSeek - تم تقطيره إلى بنية Llama 70B. بناءً على اختبارات المعايير والتقييمات البشرية، يظهر هذا النموذج ذكاءً أكبر من Llama 70B الأصلي، خاصة في المهام التي تتطلب دقة رياضية وحقائق."
  },
  "deepseek-r1-distill-llama-8b": {
    "description": "نموذج DeepSeek-R1-Distill تم تطويره من خلال تقنية تقطير المعرفة، حيث تم تعديل عينات تم إنشاؤها بواسطة DeepSeek-R1 على نماذج مفتوحة المصدر مثل Qwen وLlama."
  },
+  "deepseek-r1-distill-qianfan-llama-70b": {
+    "description": "تم إصداره لأول مرة في 14 فبراير 2025، تم استخلاصه بواسطة فريق تطوير نموذج Qianfan باستخدام Llama3_70B كنموذج أساسي (مبني على Meta Llama)، وتم إضافة نصوص Qianfan إلى بيانات الاستخلاص."
+  },
+  "deepseek-r1-distill-qianfan-llama-8b": {
+    "description": "تم إصداره لأول مرة في 14 فبراير 2025، تم استخلاصه بواسطة فريق تطوير نموذج Qianfan باستخدام Llama3_8B كنموذج أساسي (مبني على Meta Llama)، وتم إضافة نصوص Qianfan إلى بيانات الاستخلاص."
+  },
+  "deepseek-r1-distill-qwen": {
+    "description": "deepseek-r1-distill-qwen هو نموذج مستخلص من DeepSeek-R1 بناءً على Qwen."
+  },
  "deepseek-r1-distill-qwen-1.5b": {
    "description": "نموذج DeepSeek-R1-Distill تم تطويره من خلال تقنية تقطير المعرفة، حيث تم تعديل عينات تم إنشاؤها بواسطة DeepSeek-R1 على نماذج مفتوحة المصدر مثل Qwen وLlama."
  },
@@ -677,6 +728,12 @@
  "deepseek-r1-distill-qwen-7b": {
    "description": "نموذج DeepSeek-R1-Distill تم تطويره من خلال تقنية تقطير المعرفة، حيث تم تعديل عينات تم إنشاؤها بواسطة DeepSeek-R1 على نماذج مفتوحة المصدر مثل Qwen وLlama."
  },
+  "deepseek-r1-fast-online": {
+    "description": "DeepSeek R1 النسخة السريعة الكاملة، تدعم البحث المتصل في الوقت الحقيقي، تجمع بين القدرات القوية لـ 671 مليار معلمة وسرعة استجابة أسرع."
+  },
+  "deepseek-r1-online": {
+    "description": "DeepSeek R1 النسخة الكاملة، تحتوي على 671 مليار معلمة، تدعم البحث المتصل في الوقت الحقيقي، وتتمتع بقدرات فهم وتوليد أقوى."
+  },
  "deepseek-reasoner": {
    "description": "نموذج الاستدلال الذي أطلقته DeepSeek. قبل تقديم الإجابة النهائية، يقوم النموذج أولاً بإخراج سلسلة من المحتوى الفكري لتحسين دقة الإجابة النهائية."
  },
@@ -689,6 +746,9 @@
  "deepseek-v3": {
    "description": "DeepSeek-V3 هو نموذج MoE تم تطويره بواسطة شركة Hangzhou DeepSeek AI Technology Research Co.، Ltd، وقد حقق نتائج بارزة في العديد من التقييمات، ويحتل المرتبة الأولى بين نماذج المصدر المفتوح في القوائم الرئيسية. مقارنةً بنموذج V2.5، حقق V3 زيادة في سرعة التوليد بمقدار 3 مرات، مما يوفر تجربة استخدام أسرع وأكثر سلاسة للمستخدمين."
  },
+  "deepseek-v3-0324": {
+    "description": "DeepSeek-V3-0324 هو نموذج MoE يحتوي على 671 مليار معلمة، ويتميز بقدرات بارزة في البرمجة والتقنية، وفهم السياق ومعالجة النصوص الطويلة."
+  },
  "deepseek/deepseek-chat": {
    "description": "نموذج مفتوح المصدر جديد يجمع بين القدرات العامة وقدرات البرمجة، لا يحتفظ فقط بقدرات الحوار العامة لنموذج الدردشة الأصلي وقدرات معالجة الأكواد القوية لنموذج Coder، بل يتماشى أيضًا بشكل أفضل مع تفضيلات البشر. بالإضافة إلى ذلك، حقق DeepSeek-V2.5 تحسينات كبيرة في مهام الكتابة، واتباع التعليمات، وغيرها من المجالات."
  },
@@ -755,6 +815,9 @@
  "ernie-4.0-turbo-8k-preview": {
    "description": "نموذج اللغة الكبير الرائد الذي طورته بايدو، والذي يظهر أداءً ممتازًا بشكل شامل، ويستخدم على نطاق واسع في مشاهد المهام المعقدة في مختلف المجالات؛ يدعم الاتصال التلقائي بمكونات البحث من بايدو، مما يضمن تحديث معلومات الإجابة. مقارنةً بـ ERNIE 4.0، يظهر أداءً أفضل."
  },
+  "ernie-4.5-8k-preview": {
+    "description": "نموذج ونسين 4.5 هو نموذج أساسي جديد متعدد الوسائط تم تطويره ذاتيًا بواسطة بايدو، من خلال نمذجة متعددة الوسائط لتحقيق تحسين متزامن، ويظهر قدرة ممتازة على الفهم متعدد الوسائط؛ يتمتع بقدرات لغوية متقدمة، مع تحسين شامل في الفهم، والتوليد، والمنطق، والذاكرة، مع تحسين كبير في إزالة الأوهام، والاستدلال المنطقي، وقدرات البرمجة."
+  },
  "ernie-char-8k": {
    "description": "نموذج اللغة الكبير المخصص الذي طورته بايدو، مناسب لتطبيقات مثل NPC في الألعاب، محادثات خدمة العملاء، وأدوار الحوار، حيث يتميز بأسلوب شخصيات واضح ومتسق، وقدرة قوية على اتباع التعليمات، وأداء استدلال ممتاز."
  },
@@ -788,9 +851,6 @@
  "gemini-1.0-pro-latest": {
    "description": "Gemini 1.0 Pro هو نموذج ذكاء اصطناعي عالي الأداء من Google، مصمم للتوسع في مجموعة واسعة من المهام."
  },
-  "gemini-1.5-flash": {
-    "description": "جمني 1.5 فلاش هو أحدث نموذج ذكاء اصطناعي متعدد الوسائط من جوجل، يتمتع بقدرة معالجة سريعة، ويدعم إدخال النصوص والصور والفيديو، مما يجعله مناسبًا للتوسع الفعال في مجموعة متنوعة من المهام."
-  },
  "gemini-1.5-flash-001": {
    "description": "Gemini 1.5 Flash 001 هو نموذج متعدد الوسائط فعال، يدعم التوسع في التطبيقات الواسعة."
  },
@@ -803,6 +863,9 @@
  "gemini-1.5-flash-8b-exp-0924": {
    "description": "جمني 1.5 فلاش 8B 0924 هو النموذج التجريبي الأحدث، حيث حقق تحسينات ملحوظة في الأداء في حالات الاستخدام النصية ومتعددة الوسائط."
  },
+  "gemini-1.5-flash-8b-latest": {
+    "description": "Gemini 1.5 Flash 8B هو نموذج متعدد الوسائط فعال يدعم التوسع في مجموعة واسعة من التطبيقات."
+  },
  "gemini-1.5-flash-exp-0827": {
    "description": "جيميني 1.5 فلاش 0827 يقدم قدرة معالجة متعددة الوسائط محسنة، مناسب لمجموعة متنوعة من سيناريوهات المهام المعقدة."
  },
@@ -830,24 +893,27 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash يقدم ميزات وتحسينات من الجيل التالي، بما في ذلك سرعة فائقة، واستخدام أدوات أصلية، وتوليد متعدد الوسائط، ونافذة سياق تصل إلى 1M توكن."
  },
+  "gemini-2.0-flash-exp": {
+    "description": "نموذج جمنيس 2.0 فلاش، تم تحسينه لتحقيق أهداف مثل الكفاءة من حيث التكلفة وانخفاض الكمون."
+  },
+  "gemini-2.0-flash-exp-image-generation": {
+    "description": "نموذج تجريبي Gemini 2.0 Flash، يدعم توليد الصور"
+  },
  "gemini-2.0-flash-lite": {
    "description": "نموذج جمنّي 2.0 فلاش هو نسخة معدلة، تم تحسينها لتحقيق الكفاءة من حيث التكلفة والحد من التأخير."
  },
  "gemini-2.0-flash-lite-001": {
    "description": "نموذج جمنّي 2.0 فلاش هو نسخة معدلة، تم تحسينها لتحقيق الكفاءة من حيث التكلفة والحد من التأخير."
  },
-  "gemini-2.0-flash-lite-preview-02-05": {
-    "description": "نموذج Gemini 2.0 Flash، تم تحسينه لأهداف التكلفة المنخفضة والكمون المنخفض."
-  },
-  "gemini-2.0-flash-thinking-exp": {
-    "description": "Gemini 2.0 Flash Exp هو أحدث نموذج تجريبي متعدد الوسائط من Google، يتمتع بميزات الجيل التالي، وسرعة فائقة، واستدعاء أدوات أصلية، وتوليد متعدد الوسائط."
-  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp هو أحدث نموذج تجريبي متعدد الوسائط من Google، يتمتع بميزات الجيل التالي، وسرعة فائقة، واستدعاء أدوات أصلية، وتوليد متعدد الوسائط."
  },
  "gemini-2.0-pro-exp-02-05": {
    "description": "Gemini 2.0 Pro Experimental هو أحدث نموذج ذكاء اصطناعي متعدد الوسائط التجريبي من Google، مع تحسينات ملحوظة في الجودة مقارنة بالإصدارات السابقة، خاصة في المعرفة العالمية، والبرمجة، والسياقات الطويلة."
  },
+  "gemini-2.5-pro-exp-03-25": {
+    "description": "نموذج Gemini 2.5 Pro التجريبي هو الأكثر تقدمًا من Google، قادر على استنتاج المشكلات المعقدة في البرمجة والرياضيات وعلوم STEM، بالإضافة إلى تحليل مجموعات البيانات الكبيرة ومكتبات الشيفرات والمستندات باستخدام سياقات طويلة."
+  },
  "gemma-7b-it": {
    "description": "Gemma 7B مناسب لمعالجة المهام المتوسطة والصغيرة، ويجمع بين الكفاءة من حيث التكلفة."
  },
@@ -1016,6 +1082,9 @@
  "gpt-4o-mini-realtime-preview": {
    "description": "الإصدار المصغر الفوري من GPT-4o، يدعم إدخال وإخراج الصوت والنص في الوقت الحقيقي."
  },
+  "gpt-4o-mini-tts": {
+    "description": "GPT-4o mini TTS هو نموذج تحويل النص إلى كلام، مبني على GPT-4o mini، يقدم إنتاج كلمات صوتية عالية الجودة بسعر أقل."
+  },
  "gpt-4o-realtime-preview": {
    "description": "الإصدار الفوري من GPT-4o، يدعم إدخال وإخراج الصوت والنص في الوقت الحقيقي."
  },
@@ -1073,6 +1142,12 @@
  "hunyuan-standard-vision": {
    "description": "نموذج متعدد الوسائط حديث يدعم الإجابة بعدة لغات، مع توازن في القدرات بين الصينية والإنجليزية."
  },
+  "hunyuan-t1-20250321": {
+    "description": "بناء شامل لقدرات النموذج في العلوم الإنسانية والطبيعية، مع قدرة قوية على التقاط المعلومات من النصوص الطويلة. يدعم الاستدلال والإجابة على مشكلات علمية متنوعة من الرياضيات/المنطق/العلوم/الشيفرات."
+  },
+  "hunyuan-t1-latest": {
+    "description": "أول نموذج استدلال هجين ضخم في الصناعة، يوسع قدرات الاستدلال، بسرعة فك تشفير فائقة، ويعزز التوافق مع تفضيلات البشر."
+  },
  "hunyuan-translation": {
    "description": "يدعم الترجمة بين 15 لغة بما في ذلك الصينية والإنجليزية واليابانية والفرنسية والبرتغالية والإسبانية والتركية والروسية والعربية والكورية والإيطالية والألمانية والفيتنامية والماليزية والإندونيسية، ويعتمد على مجموعة تقييم الترجمة متعددة السيناريوهات لتقييم تلقائي باستخدام درجة COMET، حيث يتفوق بشكل عام على نماذج السوق المماثلة في القدرة على الترجمة بين اللغات الشائعة."
  },
@@ -1082,9 +1157,6 @@
  "hunyuan-turbo": {
    "description": "نسخة المعاينة من الجيل الجديد من نموذج اللغة الكبير، يستخدم هيكل نموذج الخبراء المختلط (MoE) الجديد، مما يوفر كفاءة استدلال أسرع وأداء أقوى مقارنة بـ hunyuan-pro."
  },
-  "hunyuan-turbo-20241120": {
-    "description": "الإصدار الثابت من hunyuan-turbo بتاريخ 20 نوفمبر 2024، وهو إصدار يقع بين hunyuan-turbo و hunyuan-turbo-latest."
-  },
  "hunyuan-turbo-20241223": {
    "description": "تحسينات في هذا الإصدار: توجيه البيانات، مما يعزز بشكل كبير قدرة النموذج على التعميم؛ تحسين كبير في القدرات الرياضية، البرمجية، وقدرات الاستدلال المنطقي؛ تحسين القدرات المتعلقة بفهم النصوص والكلمات؛ تحسين جودة إنشاء محتوى النص."
  },
@@ -1094,6 +1166,15 @@
  "hunyuan-turbo-vision": {
    "description": "نموذج اللغة البصرية الرائد من الجيل الجديد، يستخدم هيكل نموذج الخبراء المختلط (MoE) الجديد، مع تحسين شامل في القدرات المتعلقة بفهم النصوص والصور، وإنشاء المحتوى، والأسئلة والأجوبة المعرفية، والتحليل والاستدلال مقارنة بالنماذج السابقة."
  },
+  "hunyuan-turbos-20250226": {
+    "description": "hunyuan-TurboS pv2.1.2 هو إصدار ثابت تم تحديث قاعدة التدريب لرموز التوكن؛ تعزيز القدرات الفكرية في الرياضيات/المنطق/البرمجة؛ تحسين تجربة الاستخدام العامة باللغتين الصينية والإنجليزية، بما في ذلك إنشاء النصوص، وفهم النصوص، والأسئلة والأجوبة المعرفية، والدردشة."
+  },
+  "hunyuan-turbos-20250313": {
+    "description": "توحيد أسلوب خطوات حل المسائل الرياضية، وتعزيز الأسئلة والأجوبة الرياضية متعددة الجولات. تحسين أسلوب الإجابة في إنشاء النصوص، وإزالة طابع الذكاء الاصطناعي، وزيادة البلاغة."
+  },
+  "hunyuan-turbos-latest": {
+    "description": "hunyuan-TurboS هو أحدث إصدار من نموذج هونيان الرائد، يتمتع بقدرات تفكير أقوى وتجربة أفضل."
+  },
  "hunyuan-vision": {
    "description": "نموذج Hunyuan الأحدث متعدد الوسائط، يدعم إدخال الصور والنصوص لتوليد محتوى نصي."
  },
@@ -1124,12 +1205,18 @@
  "lite": {
    "description": "سبارك لايت هو نموذج لغوي كبير خفيف الوزن، يتميز بتأخير منخفض للغاية وكفاءة عالية في المعالجة، وهو مجاني تمامًا ومفتوح، ويدعم وظيفة البحث عبر الإنترنت في الوقت الحقيقي. تجعل خصائص استجابته السريعة منه مثاليًا لتطبيقات الاستدلال على الأجهزة ذات القدرة الحاسوبية المنخفضة وضبط النماذج، مما يوفر للمستخدمين قيمة ممتازة من حيث التكلفة وتجربة ذكية، خاصة في مجالات الأسئلة والأجوبة المعرفية، وتوليد المحتوى، وسيناريوهات البحث."
  },
+  "llama-2-7b-chat": {
+    "description": "Llama2 هو سلسلة من النماذج اللغوية الكبيرة (LLM) التي طورتها Meta وأطلقتها كمصدر مفتوح، وهي تتكون من نماذج توليد نص مسبقة التدريب ومتخصصة بحجم يتراوح من 7 مليارات إلى 70 مليار معلمة. على مستوى العمارة، Llama2 هو نموذج لغوي تراجعي تلقائي يستخدم معمارية محول محسنة. الإصدارات المعدلة تستخدم التدريب الدقيق تحت الإشراف (SFT) والتعلم التقويمي مع تعزيزات من البشر (RLHF) لتوافق تفضيلات البشر فيما يتعلق بالفائدة والأمان. أظهر Llama2 أداءً أفضل بكثير من سلسلة Llama في العديد من المجموعات الأكاديمية، مما قدم إلهامًا لتصميم وتطوير العديد من النماذج الأخرى."
+  },
  "llama-3.1-70b-versatile": {
    "description": "Llama 3.1 70B يوفر قدرة استدلال ذكائي أقوى، مناسب للتطبيقات المعقدة، يدعم معالجة حسابية ضخمة ويضمن الكفاءة والدقة."
  },
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B هو نموذج عالي الأداء، يوفر قدرة سريعة على توليد النصوص، مما يجعله مثاليًا لمجموعة من التطبيقات التي تتطلب كفاءة كبيرة وتكلفة فعالة."
  },
+  "llama-3.1-instruct": {
+    "description": "تم تحسين نموذج Llama 3.1 المعدل للتعليمات خصيصًا لسيناريوهات الحوار، حيث يتفوق على العديد من نماذج الدردشة مفتوحة المصدر الحالية في معايير الصناعة الشائعة."
+  },
  "llama-3.2-11b-vision-instruct": {
    "description": "قدرة استدلال الصور التي تبرز في الصور عالية الدقة، مناسبة لتطبيقات الفهم البصري."
  },
@@ -1142,12 +1229,18 @@
  "llama-3.2-90b-vision-preview": {
    "description": "Llama 3.2 مصمم للتعامل مع المهام التي تجمع بين البيانات البصرية والنصية. يظهر أداءً ممتازًا في مهام وصف الصور والأسئلة البصرية، متجاوزًا الفجوة بين توليد اللغة والاستدلال البصري."
  },
+  "llama-3.2-vision-instruct": {
+    "description": "تم تحسين نموذج Llama 3.2-Vision المعدل للتعليمات للتعرف البصري، والاستدلال على الصور، ووصف الصور، والإجابة على الأسئلة العامة المتعلقة بالصور."
+  },
  "llama-3.3-70b-instruct": {
    "description": "Llama 3.3 هو النموذج الأكثر تقدمًا في سلسلة Llama، وهو نموذج لغوي مفتوح المصدر متعدد اللغات، يوفر تجربة أداء تنافس نموذج 405B بتكلفة منخفضة للغاية. يعتمد على هيكل Transformer، وتم تحسين فائدته وأمانه من خلال التعديل الدقيق تحت الإشراف (SFT) والتعلم المعزز من خلال التغذية الراجعة البشرية (RLHF). تم تحسين نسخة التعديل الخاصة به لتكون مثالية للحوار متعدد اللغات، حيث يتفوق في العديد من المعايير الصناعية على العديد من نماذج الدردشة المفتوحة والمغلقة. تاريخ انتهاء المعرفة هو ديسمبر 2023."
  },
  "llama-3.3-70b-versatile": {
    "description": "ميتّا لاما 3.3 هو نموذج لغة كبير متعدد اللغات (LLM) يضم 70 مليار (إدخال نص/إخراج نص) من النموذج المدرب مسبقًا والمعدل وفقًا للتعليمات. تم تحسين نموذج لاما 3.3 المعدل وفقًا للتعليمات للاستخدامات الحوارية متعددة اللغات ويتفوق على العديد من النماذج المتاحة مفتوحة المصدر والمغلقة في المعايير الصناعية الشائعة."
  },
+  "llama-3.3-instruct": {
+    "description": "تم تحسين نموذج Llama 3.3 المعدل للتعليمات خصيصًا لسيناريوهات المحادثة، حيث تفوق على العديد من نماذج الدردشة مفتوحة المصدر الحالية في اختبارات المعايير الصناعية الشائعة."
+  },
  "llama3-70b-8192": {
    "description": "Meta Llama 3 70B يوفر قدرة معالجة معقدة لا مثيل لها، مصمم خصيصًا للمشاريع ذات المتطلبات العالية."
  },
@@ -1187,6 +1280,9 @@
  "max-32k": {
    "description": "سبارك ماكس 32K مزود بقدرة معالجة سياق كبيرة، مع فهم أقوى للسياق وقدرة على الاستدلال المنطقي، يدعم إدخال نصوص تصل إلى 32K توكن، مما يجعله مناسبًا لقراءة الوثائق الطويلة، والأسئلة والأجوبة المعرفية الخاصة، وغيرها من السيناريوهات."
  },
+  "megrez-3b-instruct": {
+    "description": "Megrez-3B-Instruct هو نموذج لغة كبير تم تدريبه بشكل مستقل من قبل شركة ووون تشينغ. يهدف Megrez-3B-Instruct إلى تقديم حل ذكاء على جهاز نهائي سريع وصغير وسهل الاستخدام من خلال مفهوم التكامل بين البرمجيات والأجهزة."
+  },
  "meta-llama-3-70b-instruct": {
    "description": "نموذج قوي بحجم 70 مليار معلمة يتفوق في التفكير، والترميز، وتطبيقات اللغة الواسعة."
  },
@@ -1223,9 +1319,6 @@
  "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": {
    "description": "تم تصميم LLaMA 3.2 لمعالجة المهام التي تجمع بين البيانات البصرية والنصية. إنه يبرز في مهام وصف الصور والأسئلة البصرية، متجاوزًا الفجوة بين توليد اللغة واستدلال الرؤية."
  },
-  "meta-llama/Llama-3.3-70B-Instruct": {
-    "description": "Llama 3.3 هو أحدث نموذج لغوي مفتوح المصدر متعدد اللغات من سلسلة Llama، يقدم تجربة مشابهة لأداء نموذج 405B بتكلفة منخفضة للغاية. يعتمد على هيكل Transformer، وتم تحسينه من خلال التعديل الإشرافي (SFT) والتعلم المعزز من خلال ردود الفعل البشرية (RLHF) لتعزيز الفائدة والأمان. تم تحسين نسخة التعديل الخاصة به للحوار متعدد اللغات، حيث يتفوق في العديد من المعايير الصناعية على العديد من نماذج الدردشة المفتوحة والمغلقة. تاريخ انتهاء المعرفة هو ديسمبر 2023."
-  },
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
    "description": "نموذج Meta Llama 3.3 متعدد اللغات (LLM) هو نموذج توليد تم تدريبه مسبقًا وضبطه على التعليمات في 70B (إدخال نص/إخراج نص). تم تحسين نموذج Llama 3.3 المعدل على التعليمات لحالات استخدام الحوار متعدد اللغات، ويتفوق على العديد من نماذج الدردشة المفتوحة والمغلقة المتاحة في المعايير الصناعية الشائعة."
  },
@@ -1253,15 +1346,9 @@
  "meta-llama/Meta-Llama-3.1-70B": {
    "description": "Llama 3.1 هو نموذج رائد أطلقته Meta، يدعم ما يصل إلى 405B من المعلمات، ويمكن تطبيقه في مجالات المحادثات المعقدة، والترجمة متعددة اللغات، وتحليل البيانات."
  },
-  "meta-llama/Meta-Llama-3.1-70B-Instruct": {
-    "description": "LLaMA 3.1 70B يوفر دعمًا فعالًا للحوار متعدد اللغات."
-  },
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
    "description": "نموذج Llama 3.1 70B تم ضبطه بدقة، مناسب للتطبيقات ذات الحمل العالي، تم تكميمه إلى FP8 لتوفير قدرة حسابية ودقة أعلى، مما يضمن أداءً ممتازًا في السيناريوهات المعقدة."
  },
-  "meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "LLaMA 3.1 يوفر دعمًا متعدد اللغات، وهو واحد من النماذج الرائدة في الصناعة."
-  },
  "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
    "description": "نموذج Llama 3.1 8B يستخدم FP8 للتكميم، يدعم ما يصل إلى 131,072 علامة سياق، وهو من بين الأفضل في النماذج المفتوحة المصدر، مناسب للمهام المعقدة، ويظهر أداءً ممتازًا في العديد من المعايير الصناعية."
  },
@@ -1355,12 +1442,18 @@
  "mistral-large": {
    "description": "Mixtral Large هو النموذج الرائد من Mistral، يجمع بين قدرات توليد الشيفرة، والرياضيات، والاستدلال، ويدعم نافذة سياق تصل إلى 128k."
  },
+  "mistral-large-instruct": {
+    "description": "Mistral-Large-Instruct-2407 هو نموذج لغوي كبير متقدم (LLM) بكثافة عالية، يضم 123 مليار معلمة، ويتمتع بقدرات استدلالية ومعرفية وبرمجية متطورة."
+  },
  "mistral-large-latest": {
    "description": "Mistral Large هو النموذج الرائد، يتفوق في المهام متعددة اللغات، والاستدلال المعقد، وتوليد الشيفرة، وهو الخيار المثالي للتطبيقات الراقية."
  },
  "mistral-nemo": {
    "description": "Mistral Nemo تم تطويره بالتعاون بين Mistral AI وNVIDIA، وهو نموذج 12B عالي الأداء."
  },
+  "mistral-nemo-instruct": {
+    "description": "Mistral-Nemo-Instruct-2407 هو نموذج لغوي كبير (LLM) وهو نسخة معدلة بالتعليمات من Mistral-Nemo-Base-2407."
+  },
  "mistral-small": {
    "description": "يمكن استخدام Mistral Small في أي مهمة تعتمد على اللغة تتطلب كفاءة عالية وزمن استجابة منخفض."
  },
@@ -1577,6 +1670,12 @@
  "qwen2": {
    "description": "Qwen2 هو نموذج لغوي كبير من الجيل الجديد من Alibaba، يدعم أداءً ممتازًا لتلبية احتياجات التطبيقات المتنوعة."
  },
+  "qwen2-72b-instruct": {
+    "description": "Qwen2 هو سلسلة نماذج لغوية كبيرة جديدة تم إطلاقها من قبل فريق Qwen. تعتمد هذه النماذج على هندسة Transformer وتستخدم دالة التنشيط SwiGLU، وتحيز الانتباه QKV (attention QKV bias)، وانتباه الاستفسار الجماعي (group query attention)، وخلط انتباه النافذة المتزحلقة والانتباه الكامل (mixture of sliding window attention and full attention). بالإضافة إلى ذلك، قام فريق Qwen بتحسين مجزئ يتكيف مع العديد من اللغات الطبيعية والأكواد."
+  },
+  "qwen2-7b-instruct": {
+    "description": "Qwen2 هو سلسلة نماذج لغوية كبيرة جديدة تم طرحها من قبل فريق Qwen. يعتمد هذا النموذج على هندسة Transformer، ويستخدم دالة التنشيط SwiGLU، وتحيز QKV للانتباه (attention QKV bias)، وانتباه الاستفسار الجماعي (group query attention)، وخلط انتباه النافذة المتزحلقة والانتباه الكامل. بالإضافة إلى ذلك، قام فريق Qwen بتحسين المقطّع الذي يتكيف مع العديد من اللغات الطبيعية والأكواد."
+  },
  "qwen2.5": {
    "description": "Qwen2.5 هو الجيل الجديد من نماذج اللغة الكبيرة من Alibaba، يدعم احتياجات التطبيقات المتنوعة بأداء ممتاز."
  },
@@ -1604,6 +1703,12 @@
  "qwen2.5-coder-7b-instruct": {
    "description": "نسخة مفتوحة المصدر من نموذج Qwen للبرمجة."
  },
+  "qwen2.5-coder-instruct": {
+    "description": "Qwen2.5-Coder هو أحدث نموذج لغوي كبير مخصص للبرمجة في سلسلة Qwen (المعروف سابقًا باسم CodeQwen)."
+  },
+  "qwen2.5-instruct": {
+    "description": "Qwen2.5 هي أحدث سلسلة من نماذج Qwen للغة الكبيرة. بالنسبة لـ Qwen2.5، قمنا بإصدار نماذج لغة أساسية متعددة ونماذج لغة مضبوطة بالتعليمات، مع نطاق معلمات يتراوح من 0.5 مليار إلى 72 مليار."
+  },
  "qwen2.5-math-1.5b-instruct": {
    "description": "نموذج Qwen-Math لديه قدرة قوية على حل المسائل الرياضية."
  },
@@ -1613,12 +1718,21 @@
  "qwen2.5-math-7b-instruct": {
    "description": "نموذج Qwen-Math يتمتع بقدرات قوية في حل المسائل الرياضية."
  },
+  "qwen2.5-omni-7b": {
+    "description": "تدعم نماذج سلسلة Qwen-Omni إدخال بيانات متعددة الأنماط، بما في ذلك الفيديو والصوت والصور والنصوص، وتخرج الصوت والنص."
+  },
+  "qwen2.5-vl-32b-instruct": {
+    "description": "سلسلة نماذج Qwen2.5-VL تعزز مستوى الذكاء والفعّالية والملاءمة للنماذج، مما يجعل أداءها أفضل في سيناريوهات مثل المحادثات الطبيعية، وإنشاء المحتوى، وتقديم الخدمات المتخصصة، وتطوير الأكواد. يستخدم الإصدار 32B تقنية التعلم المعزز لتحسين النموذج، مقارنةً بنماذج سلسلة Qwen2.5 VL الأخرى، حيث يقدم أسلوب إخراج أكثر توافقًا مع تفضيلات البشر، وقدرة على استنتاج المسائل الرياضية المعقدة، بالإضافة إلى فهم واستدلال دقيق للصور."
+  },
  "qwen2.5-vl-72b-instruct": {
    "description": "تحسين شامل في اتباع التعليمات، الرياضيات، حل المشكلات، والبرمجة، وزيادة قدرة التعرف على العناصر البصرية، يدعم تنسيقات متعددة لتحديد العناصر البصرية بدقة، ويدعم فهم ملفات الفيديو الطويلة (حتى 10 دقائق) وتحديد اللحظات الزمنية بدقة، قادر على فهم التسلسل الزمني والسرعة، يدعم التحكم في أنظمة التشغيل أو الوكلاء المحمولة بناءً على قدرات التحليل والتحديد، قوي في استخراج المعلومات الرئيسية وإخراج البيانات بتنسيق Json، هذه النسخة هي النسخة 72B، وهي الأقوى في هذه السلسلة."
  },
  "qwen2.5-vl-7b-instruct": {
    "description": "تحسين شامل في اتباع التعليمات، الرياضيات، حل المشكلات، والبرمجة، وزيادة قدرة التعرف على العناصر البصرية، يدعم تنسيقات متعددة لتحديد العناصر البصرية بدقة، ويدعم فهم ملفات الفيديو الطويلة (حتى 10 دقائق) وتحديد اللحظات الزمنية بدقة، قادر على فهم التسلسل الزمني والسرعة، يدعم التحكم في أنظمة التشغيل أو الوكلاء المحمولة بناءً على قدرات التحليل والتحديد، قوي في استخراج المعلومات الرئيسية وإخراج البيانات بتنسيق Json، هذه النسخة هي النسخة 72B، وهي الأقوى في هذه السلسلة."
  },
+  "qwen2.5-vl-instruct": {
+    "description": "Qwen2.5-VL هو أحدث إصدار من نماذج الرؤية واللغة في عائلة نماذج Qwen."
+  },
  "qwen2.5:0.5b": {
    "description": "Qwen2.5 هو الجيل الجديد من نماذج اللغة الكبيرة من Alibaba، يدعم احتياجات التطبيقات المتنوعة بأداء ممتاز."
  },
@@ -1754,6 +1868,9 @@
  "wizardlm2:8x22b": {
    "description": "WizardLM 2 هو نموذج لغوي تقدمه Microsoft AI، يتميز بأداء ممتاز في الحوار المعقد، واللغات المتعددة، والاستدلال، والمساعدين الذكيين."
  },
+  "yi-1.5-34b-chat": {
+    "description": "يي-1.5 هو إصدار مُحدّث من يي. تم تدريبه بشكل مُسبق باستخدام مكتبة بيانات عالية الجودة تحتوي على 500 مليار علامة (Token) على يي، وتم تحسينه أيضًا باستخدام 3 ملايين مثال متنوع للتدريب الدقيق."
+  },
  "yi-large": {
    "description": "نموذج جديد بمليارات المعلمات، يوفر قدرة قوية على الإجابة وتوليد النصوص."
  },
@@ -23,6 +23,9 @@
  "cloudflare": {
    "description": "تشغيل نماذج التعلم الآلي المدفوعة بوحدات معالجة الرسوميات بدون خادم على شبكة Cloudflare العالمية."
  },
+  "cohere": {
+    "description": "تقدم Cohere أحدث نماذج متعددة اللغات، وميزات بحث متقدمة، ومساحة عمل AI مصممة خصيصًا للشركات الحديثة - كل ذلك مدمج في منصة آمنة."
+  },
  "deepseek": {
    "description": "DeepSeek هي شركة تركز على أبحاث وتطبيقات تقنيات الذكاء الاصطناعي، حيث يجمع نموذجها الأحدث DeepSeek-V2.5 بين قدرات الحوار العامة ومعالجة الشيفرات، وقد حقق تحسينات ملحوظة في محاذاة تفضيلات البشر، ومهام الكتابة، واتباع التعليمات."
  },
@@ -53,6 +56,9 @@
  "hunyuan": {
    "description": "نموذج لغة متقدم تم تطويره بواسطة Tencent، يتمتع بقدرة قوية على الإبداع باللغة الصينية، وقدرة على الاستدلال المنطقي في سياقات معقدة، بالإضافة إلى قدرة موثوقة على تنفيذ المهام."
  },
+  "infiniai": {
+    "description": "يقدم خدمات نماذج كبيرة ذات أداء عالٍ وسهولة الاستخدام وأمان موثوق به للمطورين، تغطي كامل العملية من تطوير النماذج الكبيرة إلى نشرها كخدمات."
+  },
  "internlm": {
    "description": "منظمة مفتوحة المصدر مكرسة لأبحاث وتطوير أدوات النماذج الكبيرة. توفر منصة مفتوحة المصدر فعالة وسهلة الاستخدام لجميع مطوري الذكاء الاصطناعي، مما يجعل أحدث تقنيات النماذج الكبيرة والخوارزميات في متناول اليد."
  },
@@ -98,6 +104,9 @@
  "sambanova": {
    "description": "تتيح لك سحابة SambaNova استخدام أفضل النماذج مفتوحة المصدر بسهولة، والاستمتاع بأسرع سرعة استدلال."
  },
+  "search1api": {
+    "description": "يوفر Search1API الوصول إلى سلسلة نماذج DeepSeek التي يمكن الاتصال بها حسب الحاجة، بما في ذلك النسخة القياسية والنسخة السريعة، مع دعم لاختيار نماذج بمقاييس معلمات متعددة."
+  },
  "sensenova": {
    "description": "تقدم شركة SenseTime خدمات نماذج كبيرة شاملة وسهلة الاستخدام، مدعومة بقوة من البنية التحتية الكبيرة لشركة SenseTime."
  },
@@ -137,6 +146,9 @@
  "xai": {
    "description": "xAI هي شركة تكرّس جهودها لبناء الذكاء الاصطناعي لتسريع الاكتشافات العلمية البشرية. مهمتنا هي تعزيز فهمنا المشترك للكون."
  },
+  "xinference": {
+    "description": "Xorbits Inference (Xinference) هو منصة مفتوحة المصدر مصممة لتبسيط تشغيل ودمج نماذج الذكاء الاصطناعي المتنوعة. باستخدام Xinference، يمكنك تشغيل الاستدلال على نماذج LLM مفتوحة المصدر، ونماذج التضمين، والنماذج متعددة الوسائط سواء في السحابة أو في البيئات المحلية، وإنشاء تطبيقات ذكاء اصطناعي قوية."
+  },
  "zeroone": {
    "description": "01.AI تركز على تقنيات الذكاء الاصطناعي في عصر الذكاء الاصطناعي 2.0، وتعزز الابتكار والتطبيقات \"الإنسان + الذكاء الاصطناعي\"، باستخدام نماذج قوية وتقنيات ذكاء اصطناعي متقدمة لتعزيز إنتاجية البشر وتحقيق تمكين التكنولوجيا."
  },
@@ -42,6 +42,17 @@
    "sessionWithName": "إعدادات الجلسة · {{name}}",
    "title": "إعدادات"
  },
+  "hotkey": {
+    "conflicts": "يتعارض مع اختصارات لوحة المفاتيح الحالية",
+    "group": {
+      "conversation": "المحادثة",
+      "essential": "أساسي"
+    },
+    "invalidCombination": "يجب أن تحتوي اختصارات لوحة المفاتيح على مفتاح تعديل واحد على الأقل (Ctrl، Alt، Shift) ومفتاح عادي واحد",
+    "record": "اضغط على المفتاح لتسجيل اختصار لوحة المفاتيح",
+    "reset": "إعادة تعيين إلى اختصارات لوحة المفاتيح الافتراضية",
+    "title": "اختصارات لوحة المفاتيح"
+  },
  "llm": {
    "aesGcm": "سيتم استخدام خوارزمية التشفير <1>AES-GCM</1> لتشفير مفتاحك وعنوان الوكيل",
    "apiKey": {
@@ -335,6 +346,33 @@
    },
    "title": "إعدادات السمة"
  },
+  "storage": {
+    "actions": {
+      "export": {
+        "button": "تصدير",
+        "exportType": {
+          "agent": "تصدير إعدادات المساعد",
+          "agentWithMessage": "تصدير المساعد والرسائل",
+          "all": "تصدير الإعدادات العالمية وجميع بيانات المساعدين",
+          "allAgent": "تصدير جميع إعدادات المساعدين",
+          "allAgentWithMessage": "تصدير جميع المساعدين والرسائل",
+          "globalSetting": "تصدير الإعدادات العالمية"
+        },
+        "title": "تصدير البيانات"
+      },
+      "import": {
+        "button": "استيراد",
+        "title": "استيراد البيانات"
+      },
+      "title": "عمليات متقدمة"
+    },
+    "desc": "حجم التخزين في المتصفح الحالي",
+    "embeddings": {
+      "used": "تخزين المتجهات"
+    },
+    "title": "تخزين البيانات",
+    "used": "حجم التخزين"
+  },
  "submitAgentModal": {
    "button": "تقديم المساعد",
    "identifier": "معرف المساعد",
@@ -425,8 +463,10 @@
    "agent": "المساعد الافتراضي",
    "common": "إعدادات عامة",
    "experiment": "تجربة",
+    "hotkey": "اختصارات لوحة المفاتيح",
    "llm": "نموذج اللغة",
    "provider": "مزود خدمة الذكاء الاصطناعي",
+    "storage": "تخزين البيانات",
    "sync": "مزامنة السحابة",
    "system-agent": "مساعد النظام",
    "tts": "خدمة الكلام"
@@ -32,6 +32,7 @@
    "title": "قائمة المواضيع"
  },
  "searchPlaceholder": "ابحث عن موضوع...",
+  "searchResultEmpty": "لا توجد نتائج للبحث",
  "temp": "مؤقت",
  "title": "موضوع"
 }
@@ -64,6 +64,9 @@
    "stop": "Спри",
    "warp": "Нов ред"
  },
+  "intentUnderstanding": {
+    "title": "Разбирам и анализирам вашето намерение..."
+  },
  "knowledgeBase": {
    "all": "Всички съдържания",
    "allFiles": "Всички файлове",
@@ -144,7 +147,6 @@
        "desc": "Интелигентно определяне на необходимостта от търсене въз основа на съдържанието на разговора",
        "title": "Интелигентно свързване"
      },
-      "disable": "Текущият модел не поддържа извикване на функции, затова не може да се използва интелигентно свързване",
      "off": {
        "desc": "Използва само основните знания на модела, без интернет търсене",
        "title": "Изключване на свързването"
@@ -155,6 +157,10 @@
      },
      "useModelBuiltin": "Използване на вградената търсачка на модела"
    },
+    "searchModel": {
+      "desc": "Текущият модел не поддържа извикване на функции, затова е необходимо да се комбинира с модел, който поддържа извикване на функции, за да се извърши търсене в интернет",
+      "title": "Модел за търсене на помощ"
+    },
    "title": "Търсене в интернет"
  },
  "searchAgentPlaceholder": "Търсач на помощ...",
@@ -41,7 +41,10 @@
    "error": {
      "desc": "Извинявайте, но възникна проблем по време на инициализацията на Pglite базата данни. Моля, натиснете бутона, за да опиташ отново. Ако проблемът продължава след многократни опити, моля <1>подайте проблем</1>, и ние ще ви помогнем възможно най-скоро.",
      "detail": "Причина за грешка: [{{type}}] {{message}}. Подробности по-долу:",
+      "detailTitle": "Причина за грешка",
+      "report": "Докладвайте за проблема",
      "retry": "Опитай отново",
+      "selfSolve": "Самостоятелно решение",
      "title": "Неуспешна инициализация на базата данни"
    },
    "initing": {
@@ -80,6 +83,54 @@
      "button": "Използвайте сега",
      "desc": "Искам да използвам веднага",
      "title": "PGlite базата данни е готова"
+    },
+    "solve": {
+      "backup": {
+        "backup": "Резервно копие",
+        "backupSuccess": "Резервното копие е успешно",
+        "desc": "Експортиране на ключови данни от текущата база данни",
+        "export": "Експортиране на всички данни",
+        "exportDesc": "Експортираните данни ще бъдат запазени в JSON формат и могат да се използват за последващо възстановяване или анализ.",
+        "reset": {
+          "alert": "Предупреждение",
+          "alertDesc": "Следните действия могат да доведат до загуба на данни. Моля, уверете се, че сте направили резервно копие на важните данни, преди да продължите.",
+          "button": "Пълно нулиране на базата данни (изтриване на всички данни)",
+          "confirm": {
+            "desc": "Тази операция ще изтрие всички данни и не може да бъде отменена. Потвърдете, за да продължите?",
+            "title": "Потвърдете нулирането на базата данни"
+          },
+          "desc": "Нулиране на базата данни в случай на неизменяемо преместване",
+          "title": "Нулиране на базата данни"
+        },
+        "restore": "Възстановяване",
+        "restoreSuccess": "Възстановяването е успешно",
+        "title": "Резервно копие на данни"
+      },
+      "diagnosis": {
+        "createdAt": "Дата на създаване",
+        "migratedAt": "Дата на завършване на миграцията",
+        "sql": "Миграционен SQL",
+        "title": "Състояние на миграцията"
+      },
+      "repair": {
+        "desc": "Ръчно управление на състоянието на миграцията",
+        "runSQL": "Персонализирано изпълнение",
+        "sql": {
+          "clear": "Изчистване",
+          "desc": "Изпълнение на персонализирани SQL команди за поправка на проблеми с базата данни",
+          "markFinished": "Маркирай като завършено",
+          "placeholder": "Въведете SQL команда...",
+          "result": "Резултат от изпълнението",
+          "run": "Изпълни",
+          "title": "SQL изпълнител"
+        },
+        "title": "Контрол на миграцията"
+      },
+      "tabs": {
+        "backup": "Резервно копие и възстановяване",
+        "diagnosis": "Диагностика",
+        "repair": "Поправка"
+      }
    }
  },
  "close": "Затвори",
@@ -132,7 +183,7 @@
  },
  "fullscreen": "Цял екран",
  "historyRange": "Диапазон на историята",
-  "import": "Импортирай конфигурация",
+  "importData": "Импорт на данни",
  "importModal": {
    "error": {
      "desc": "Съжаляваме, възникна грешка по време на процеса на импорт на данни. Моля, опитайте отново да ги импортирате или <1>подайте проблем</1>, за да можем да помогнем веднага с отстраняването на проблема.",
@@ -154,7 +205,8 @@
      "sessions": "Агенти",
      "skips": "Пропуснати дубликати",
      "topics": "Теми",
-      "type": "Тип данни"
+      "type": "Тип данни",
+      "update": "Актуализиране на записа"
    },
    "title": "Импортирай данни",
    "uploading": {
@@ -163,6 +215,16 @@
      "speed": "Скорост на качване"
    }
  },
+  "importPreview": {
+    "confirmImport": "Потвърдете импорта",
+    "tables": {
+      "count": "Брой записи",
+      "name": "Име на таблицата"
+    },
+    "title": "Преглед на данните за импортиране",
+    "totalRecords": "Общо ще бъдат импортирани {{count}} записа",
+    "totalTables": "{{count}} таблици"
+  },
  "information": "Общност и информация",
  "installPWA": "Инсталиране на PWA",
  "lang": {
@@ -76,6 +76,7 @@
      "custom": "Потребителски модел, по подразбиране поддържа функционалност за функционални обаждания и визуално разпознаване, моля, потвърдете наличието на тези възможности спрямо реалните условия",
      "file": "Този модел поддържа качване на файлове и разпознаване",
      "functionCall": "Този модел поддържа функционални обаждания (Function Call)",
+      "imageOutput": "Този модел поддържа генериране на изображения",
      "reasoning": "Този модел поддържа дълбочинно мислене",
      "search": "Този модел поддържа търсене в мрежата",
      "tokens": "Този модел поддържа до {{tokens}} токена за една сесия",
@@ -85,6 +86,8 @@
  },
  "ModelSwitchPanel": {
    "emptyModel": "Няма активирани модели, моля, посетете настройките и ги активирайте",
+    "emptyProvider": "Няма активиран доставчик на услуги, моля, отидете в настройките, за да го активирате",
+    "goToSettings": "Отидете в настройките",
    "provider": "Доставчик"
  },
  "OllamaSetupGuide": {
@@ -16,6 +16,16 @@
    "detail": "Детайли за грешката",
    "title": "Заявката не успя"
  },
+  "import": {
+    "importConfigFile": {
+      "description": "Причина за грешка: {{reason}}",
+      "title": "Импортирането не успя"
+    },
+    "incompatible": {
+      "description": "Този файл е експортиран от по-висока версия, моля, опитайте да актуализирате до последната версия и след това опитайте отново да импортирате",
+      "title": "Текущото приложение не поддържа импортиране на този файл"
+    }
+  },
  "loginRequired": {
    "desc": "Ще бъдете автоматично пренасочени към страницата за вход",
    "title": "Моля, влезте, за да използвате тази функция"
@@ -69,6 +79,7 @@
    "524": "Съжаляваме, сървърът изтече времето за изчакване при очакване на отговор, вероятно поради бавен отговор, моля, опитайте отново по-късно",
    "AgentRuntimeError": "Грешка при изпълнение на времето за изпълнение на езиковия модел Lobe. Моля, отстранете неизправностите или опитайте отново въз основа на следната информация.",
    "ConnectionCheckFailed": "Заявката върна празен отговор. Моля, проверете дали адресът на API проксито не завършва с `/v1`.",
+    "CreateMessageError": "Съжалявам, съобщението не можа да бъде изпратено успешно. Моля, копирайте съдържанието и го изпратете отново. След опресняване на страницата, това съобщение няма да бъде запазено.",
    "ExceededContextWindow": "Текущото съдържание на заявката надвишава дължината, която моделът може да обработи. Моля, намалете обема на съдържанието и опитайте отново.",
    "FreePlanLimit": "В момента сте потребител на безплатен план и не можете да използвате тази функционалност. Моля, надстройте до платен план, за да продължите да я използвате.",
    "InsufficientQuota": "Съжаляваме, квотата за този ключ е достигнала лимита. Моля, проверете баланса на акаунта си или увеличете квотата на ключа и опитайте отново.",
@@ -0,0 +1,46 @@
+{
+  "addUserMessage": {
+    "desc": "Добавете текущото съдържание като съобщение от потребителя, без да задействате генерирането",
+    "title": "Добавяне на съобщение от потребителя"
+  },
+  "editMessage": {
+    "desc": "Влезте в режим на редактиране, като задържите Alt и два пъти кликнете върху съобщението",
+    "title": "Редактиране на съобщение"
+  },
+  "openChatSettings": {
+    "desc": "Прегледайте и променете настройките на текущия разговор",
+    "title": "Отворете настройките на чата"
+  },
+  "openHotkeyHelper": {
+    "desc": "Прегледайте инструкциите за използване на всички клавишни комбинации",
+    "title": "Отворете помощта за клавишни комбинации"
+  },
+  "regenerateMessage": {
+    "desc": "Прегенерирайте последното съобщение",
+    "title": "Прегенериране на съобщение"
+  },
+  "saveTopic": {
+    "desc": "Запазете текущата тема и отворете нова",
+    "title": "Създаване на нова тема"
+  },
+  "search": {
+    "desc": "Активирайте основното поле за търсене на текущата страница",
+    "title": "Търсене"
+  },
+  "switchAgent": {
+    "desc": "Сменете помощника, фиксиран в страничната лента, като задържите Ctrl и натиснете число от 0 до 9",
+    "title": "Бърза смяна на помощника"
+  },
+  "toggleLeftPanel": {
+    "desc": "Показване или скриване на панела с помощ отляво",
+    "title": "Показване/скриване на панела с помощника"
+  },
+  "toggleRightPanel": {
+    "desc": "Показване или скриване на панела с теми отдясно",
+    "title": "Показване/скриване на панела с теми"
+  },
+  "toggleZenMode": {
+    "desc": "В режим на фокус, показвайте само текущия разговор, скривайки другия интерфейс",
+    "title": "Превключване на режим на фокус"
+  }
+}
@@ -1,13 +1,4 @@
 {
-  "01-ai/Yi-1.5-34B-Chat-16K": {
-    "description": "Yi-1.5 34B предлага отлични резултати в индустриалните приложения с богат набор от обучителни примери."
-  },
-  "01-ai/Yi-1.5-6B-Chat": {
-    "description": "Yi-1.5-6B-Chat е вариант на Yi-1.5, който принадлежи към отворените модели за разговори. Yi-1.5 е подобрена версия на Yi, която е била предварително обучена на 500B висококачествени корпуси и е била фино настроена на 3M разнообразни примери. В сравнение с Yi, Yi-1.5 показва по-силни способности в кодирането, математиката, разсъжденията и следването на инструкции, като същевременно запазва отлични способности за разбиране на езика, разсъждения на общи познания и разбиране на текст. Моделът предлага версии с контекстна дължина от 4K, 16K и 32K, с общо количество предварително обучение от 3.6T токена."
-  },
-  "01-ai/Yi-1.5-9B-Chat-16K": {
-    "description": "Yi-1.5 9B поддържа 16K токена, предоставяйки ефективни и плавни способности за генериране на език."
-  },
  "01-ai/yi-1.5-34b-chat": {
    "description": "零一万物, най-новият отворен модел с фина настройка, с 34 милиарда параметри, който поддържа множество диалогови сценарии, с висококачествени обучителни данни, съобразени с човешките предпочитания."
  },
@@ -149,12 +140,6 @@
  "Llama-3.2-90B-Vision-Instruct\t": {
    "description": "Напреднали способности за визуално разсъждение, подходящи за приложения на агенти за визуално разбиране."
  },
-  "LoRA/Qwen/Qwen2.5-72B-Instruct": {
-    "description": "Qwen2.5-72B-Instruct е един от най-новите големи езикови модели, публикувани от Alibaba Cloud. Този 72B модел показва значителни подобрения в областите на кодирането и математиката. Моделът предлага многоезична поддръжка, обхващаща над 29 езика, включително китайски, английски и др. Моделът показва значителни подобрения в следването на инструкции, разбирането на структурирани данни и генерирането на структурирани изходи (особено JSON)."
-  },
-  "LoRA/Qwen/Qwen2.5-7B-Instruct": {
-    "description": "Qwen2.5-7B-Instruct е един от най-новите големи езикови модели, публикувани от Alibaba Cloud. Този 7B модел показва значителни подобрения в областите на кодирането и математиката. Моделът предлага многоезична поддръжка, обхващаща над 29 езика, включително китайски, английски и др. Моделът показва значителни подобрения в следването на инструкции, разбирането на структурирани данни и генерирането на структурирани изходи (особено JSON)."
-  },
  "Meta-Llama-3.1-405B-Instruct": {
    "description": "Текстов модел с оптимизация за инструкции на Llama 3.1, проектиран за многоезични диалогови случаи, който показва отлични резултати на много налични отворени и затворени чат модели на общи индустриални бенчмаркове."
  },
@@ -179,9 +164,6 @@
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": {
    "description": "Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) е модел с висока точност за инструкции, подходящ за сложни изчисления."
  },
-  "OpenGVLab/InternVL2-26B": {
-    "description": "InternVL2 демонстрира изключителни резултати в различни визуално-языкови задачи, включително разбиране на документи и графики, разбиране на текст в сцени, OCR, решаване на научни и математически проблеми."
-  },
  "Phi-3-medium-128k-instruct": {
    "description": "Същият модел Phi-3-medium, но с по-голям размер на контекста за RAG или малко подканване."
  },
@@ -206,9 +188,6 @@
  "Phi-3.5-vision-instrust": {
    "description": "Актуализирана версия на модела Phi-3-vision."
  },
-  "Pro/OpenGVLab/InternVL2-8B": {
-    "description": "InternVL2 демонстрира изключителни резултати в различни визуално-языкови задачи, включително разбиране на документи и графики, разбиране на текст в сцени, OCR, решаване на научни и математически проблеми."
-  },
  "Pro/Qwen/Qwen2-1.5B-Instruct": {
    "description": "Qwen2-1.5B-Instruct е голям езиков модел с параметри 1.5B от серията Qwen2, специално настроен за инструкции. Моделът е базиран на архитектурата Transformer и използва технологии като SwiGLU активационна функция, QKV отклонение за внимание и групова внимание. Той показва отлични резултати в множество бенчмаркове за разбиране на езика, генериране, многоезични способности, кодиране, математика и разсъждения, надминавайки повечето отворени модели. В сравнение с Qwen1.5-1.8B-Chat, Qwen2-1.5B-Instruct показва значителни подобрения в тестовете MMLU, HumanEval, GSM8K, C-Eval и IFEval, въпреки че параметрите са малко по-малко."
  },
@@ -224,20 +203,26 @@
  "Pro/Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct е най-новата версия на серията големи езикови модели, специфични за код, публикувана от Alibaba Cloud. Моделът значително подобрява способностите за генериране на код, разсъждения и корекции, след като е обучен с 55 трилиона токена на базата на Qwen2.5. Той не само подобрява кодовите умения, но и запазва предимствата в математиката и общите способности. Моделът предоставя по-пълна основа за практическите приложения като кодови интелигентни агенти."
  },
+  "Pro/Qwen/Qwen2.5-VL-7B-Instruct": {
+    "description": "Qwen2.5-VL е нов член от серията Qwen, който разполага с мощни възможности за визуално разбиране. Той може да анализира текст, диаграми и оформление в изображения, да разбира дълги видеоклипове и да улавя събития. Може да извършва логически изводи, да работи с инструменти, поддържа локализиране на обекти в различни формати и генериране на структуриран изход. Оптимизиран е с динамична резолюция и честота на кадрите за разбиране на видео и подобрена ефективност на визуалния кодиращ модул."
+  },
  "Pro/THUDM/glm-4-9b-chat": {
    "description": "GLM-4-9B-Chat е отворената версия на предварително обучен модел от серията GLM-4, пусната от Zhizhu AI. Моделът показва отлични резултати в семантика, математика, разсъждения, код и знания. Освен че поддържа многократни разговори, GLM-4-9B-Chat предлага и напреднали функции като уеб браузинг, изпълнение на код, извикване на персонализирани инструменти (Function Call) и разсъждения с дълги текстове. Моделът поддържа 26 езика, включително китайски, английски, японски, корейски и немски. В множество бенчмаркове, GLM-4-9B-Chat показва отлична производителност, като AlignBench-v2, MT-Bench, MMLU и C-Eval. Моделът поддържа максимална контекстна дължина от 128K, подходящ за академични изследвания и търговски приложения."
  },
  "Pro/deepseek-ai/DeepSeek-R1": {
    "description": "DeepSeek-R1 е модел за инференция, управляван от обучение с подсилване (RL), който решава проблемите с повторяемостта и четимостта в моделите. Преди RL, DeepSeek-R1 въвежда данни за студен старт, за да оптимизира допълнително производителността на инференцията. Той показва сравними резултати с OpenAI-o1 в математически, кодови и инференционни задачи и подобрява общата ефективност чрез внимателно проектирани методи на обучение."
  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+    "description": "DeepSeek-R1-Distill-Qwen-1.5B е модел, получен чрез дистилация на знания от Qwen2.5-Math-1.5B. Моделът е фино настроен с 800 000 избрани проби, генерирани от DeepSeek-R1, и демонстрира добро представяне в множество тестове. Като лек модел, той постига 83,9% точност в MATH-500, 28,9% успеваемост в AIME 2024 и рейтинг от 954 в CodeForces, показвайки способности за разсъждение, които надхвърлят неговия мащаб на параметри."
+  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+    "description": "DeepSeek-R1-Distill-Qwen-7B е модел, получен чрез дистилация на знания от Qwen2.5-Math-7B. Този модел е фино настроен с 800 000 избрани проби, генерирани от DeepSeek-R1, и демонстрира изключителни способности за разсъждение. Той се представя отлично в множество тестове, постигайки 92,8% точност в MATH-500, 55,5% успеваемост в AIME 2024 и рейтинг от 1189 в CodeForces, показвайки силни математически и програмистки способности за модел с мащаб 7B."
+  },
  "Pro/deepseek-ai/DeepSeek-V3": {
    "description": "DeepSeek-V3 е модел на езика с 6710 милиарда параметри, който използва архитектура на смесени експерти (MoE) с много глави на потенциално внимание (MLA) и стратегия за баланс на натоварването без помощни загуби, оптимизираща производителността на инференцията и обучението. Чрез предварително обучение на 14.8 трилиона висококачествени токени и последващо супервизирано фино настройване и обучение с подсилване, DeepSeek-V3 надминава производителността на други отворени модели и е близо до водещите затворени модели."
  },
-  "Pro/google/gemma-2-9b-it": {
-    "description": "Gemma е един от най-новите леки, авангардни отворени модели, разработени от Google. Това е голям езиков модел с един декодер, който поддържа английски и предлага отворени тегла, предварително обучени варианти и варианти с фино настройване на инструкции. Моделът Gemma е подходящ за различни задачи по генериране на текст, включително въпроси и отговори, резюмиране и разсъждения. Този 9B модел е обучен с 8 трилиона токена. Неговият относително малък размер позволява внедряване в среди с ограничени ресурси, като лаптопи, настолни компютри или собствена облачна инфраструктура, което позволява на повече хора да имат достъп до авангардни AI модели и да насърчават иновации."
-  },
-  "Pro/meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "Meta Llama 3.1 е семейство от многоезични големи езикови модели, разработени от Meta, включващо предварително обучени и модели с фино настройване с параметри 8B, 70B и 405B. Този 8B модел с фино настройване на инструкции е оптимизиран за многоезични разговорни сценарии и показва отлични резултати в множество индустриални бенчмаркове. Моделът е обучен с над 15 трилиона токена от публични данни и използва технологии като наблюдавано фино настройване и обучение с човешка обратна връзка, за да подобри полезността и безопасността на модела. Llama 3.1 поддържа генериране на текст и генериране на код, с дата на прекратяване на знанията до декември 2023 г."
+  "Pro/deepseek-ai/DeepSeek-V3-1226": {
+    "description": "DeepSeek-V3 е хибриден езиков модел (MoE) с 6710 милиарда параметри, използващ многоглаво внимание (MLA) и архитектурата DeepSeekMoE, комбинираща стратегия за баланс на натоварването без помощни загуби, оптимизираща ефективността на извеждане и обучение. Чрез предварително обучение на 14.8 трилиона висококачествени токени и последващо наблюдавано фино настройване и обучение с подсилване, DeepSeek-V3 надминава други отворени модели по производителност, приближавайки се до водещите затворени модели."
  },
  "QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview е иновативен модел за обработка на естествен език, способен да обработва ефективно сложни задачи за генериране на диалог и разбиране на контекста."
@@ -290,6 +275,12 @@
  "Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct е най-новата версия на серията големи езикови модели, специфични за код, публикувана от Alibaba Cloud. Моделът значително подобрява способностите за генериране на код, разсъждения и корекции, след като е обучен с 55 трилиона токена на базата на Qwen2.5. Той не само подобрява кодовите умения, но и запазва предимствата в математиката и общите способности. Моделът предоставя по-пълна основа за практическите приложения като кодови интелигентни агенти."
  },
+  "Qwen/Qwen2.5-VL-32B-Instruct": {
+    "description": "Qwen2.5-VL-32B-Instruct е многомодален голям модел, разработен от екипа на Tongyi Qianwen, част от серията Qwen2.5-VL. Този модел не само разпознава отлично обичайни обекти, но също така анализира текст, диаграми, икони, графики и оформление в изображения. Той може да функционира като визуален агент, способен да разсъждава и динамично да управлява инструменти, с възможности за работа с компютри и мобилни устройства. Освен това, моделът може точно да локализира обекти в изображения и да генерира структурирани изходи за фактури, таблици и други. В сравнение с предходния модел Qwen2-VL, тази версия е подобрена чрез усилено обучение в областта на математиката и способностите за решаване на проблеми, като стилът на отговорите е по-съобразен с човешките предпочитания."
+  },
+  "Qwen/Qwen2.5-VL-72B-Instruct": {
+    "description": "Qwen2.5-VL е визуален езиков модел от серията Qwen2.5. Този модел има значителни подобрения в различни аспекти: разполага с по-добри възможности за визуално разбиране, може да разпознава обикновени обекти, да анализира текст, диаграми и оформление; като визуален агент може да разсъждава и динамично да насочва използването на инструменти; поддържа разбиране на дълги видеоклипове с продължителност над 1 час и улавяне на ключови събития; може да локализира точно обекти в изображения чрез генериране на ограничителни кутии или точки; поддържа генериране на структуриран изход, особено подходящ за сканирани данни като фактури и таблици."
+  },
  "Qwen2-72B-Instruct": {
    "description": "Qwen2 е най-новата серия на модела Qwen, поддържаща 128k контекст. В сравнение с текущите най-добри отворени модели, Qwen2-72B значително надминава водещите модели в области като разбиране на естествен език, знания, код, математика и многоезичност."
  },
@@ -374,9 +365,6 @@
  "TeleAI/TeleChat2": {
    "description": "TeleChat2 е голям модел, разработен от China Telecom, който предлага генеративен семантичен модел, поддържащ функции като енциклопедични въпроси и отговори, генериране на код и генериране на дълги текстове, предоставяйки услуги за консултации на потребителите, способни да взаимодействат с потребителите, да отговарят на въпроси и да помагат в творчеството, ефективно и удобно помагайки на потребителите да получат информация, знания и вдъхновение. Моделът показва отлични резултати в проблеми с илюзии, генериране на дълги текстове и логическо разбиране."
  },
-  "TeleAI/TeleMM": {
-    "description": "TeleMM е многомодален голям модел, разработен от China Telecom, способен да обработва текст, изображения и други видове входни данни, поддържащ функции като разбиране на изображения и анализ на графики, предоставяйки услуги за разбиране на потребителите в различни модалности. Моделът може да взаимодейства с потребителите в многомодални сценарии, точно разбирайки входното съдържание, отговаряйки на въпроси, помагайки в творчеството и ефективно предоставяйки многомодална информация и вдъхновение. Моделът показва отлични резултати в задачи с фина перцепция и логическо разсъждение."
-  },
  "Vendor-A/Qwen/Qwen2.5-72B-Instruct": {
    "description": "Qwen2.5-72B-Instruct е един от най-новите големи езикови модели, публикувани от Alibaba Cloud. Този 72B модел показва значителни подобрения в областите на кодирането и математиката. Моделът предлага многоезична поддръжка, обхващаща над 29 езика, включително китайски, английски и др. Моделът показва значителни подобрения в следването на инструкции, разбирането на структурирани данни и генерирането на структурирани изходи (особено JSON)."
  },
@@ -506,6 +494,9 @@
  "anthropic/claude-3.5-sonnet": {
    "description": "Claude 3.5 Sonnet предлага способности, надхвърлящи Opus, и по-бърза скорост в сравнение с Sonnet, като същевременно запазва същата цена. Sonnet е особено силен в програмирането, науката за данни, визуалната обработка и агентските задачи."
  },
+  "anthropic/claude-3.7-sonnet": {
+    "description": "Claude 3.7 Sonnet е най-интелигентният модел на Anthropic до момента и е първият хибриден модел за разсъждение на пазара. Claude 3.7 Sonnet може да генерира почти мигновени отговори или удължено стъпково мислене, което позволява на потребителите ясно да видят тези процеси. Sonnet е особено добър в програмирането, науката за данни, визуалната обработка и агентските задачи."
+  },
  "aya": {
    "description": "Aya 23 е многозначен модел, представен от Cohere, поддържащ 23 езика, предоставяйки удобство за многоезични приложения."
  },
@@ -515,9 +506,27 @@
  "baichuan/baichuan2-13b-chat": {
    "description": "Baichuan-13B е отворен, комерсиален голям езиков модел, разработен от Baichuan Intelligence, с 13 милиарда параметри, който постига най-добрите резултати в своя размер на авторитетни бенчмаркове на китайски и английски."
  },
+  "c4ai-aya-expanse-32b": {
+    "description": "Aya Expanse е високопроизводителен многоезичен модел с 32B, проектиран да предизвика представянето на едноезични модели чрез иновации в настройката на инструкции, арбитраж на данни, обучение на предпочитания и комбиниране на модели. Той поддържа 23 езика."
+  },
+  "c4ai-aya-expanse-8b": {
+    "description": "Aya Expanse е високопроизводителен многоезичен модел с 8B, проектиран да предизвика представянето на едноезични модели чрез иновации в настройката на инструкции, арбитраж на данни, обучение на предпочитания и комбиниране на модели. Той поддържа 23 езика."
+  },
+  "c4ai-aya-vision-32b": {
+    "description": "Aya Vision е авангарден много модален модел, който показва отлични резултати в множество ключови бенчмаркове за езикови, текстови и визуални способности. Той поддържа 23 езика. Тази версия с 32 милиарда параметри се фокусира върху авангарден многоезичен представител."
+  },
+  "c4ai-aya-vision-8b": {
+    "description": "Aya Vision е авангарден много модален модел, който показва отлични резултати в множество ключови бенчмаркове за езикови, текстови и визуални способности. Тази версия с 8 милиарда параметри се фокусира върху ниска латентност и оптимална производителност."
+  },
  "charglm-3": {
    "description": "CharGLM-3 е проектиран за ролеви игри и емоционално придружаване, поддържаща дълга многократна памет и персонализиран диалог, с широко приложение."
  },
+  "chatglm3": {
+    "description": "ChatGLM3 е закритоизточен модел, обявен от интелигентната платформа AI и лабораторията KEG на Университета в Тайхуа. Той е претрениран с голям обем на китайски и английски идентификатори и е подложен на тренировка за съответствие с хуманите предпочитания. Сравнено с първата версия на модела, ChatGLM3 постига подобрения от 16%, 36% и 280% в MMLU, C-Eval и GSM8K съответно, и е класифициран на първо място в китайския рейтинг C-Eval. Този модел е подходящ за сценарии, които изискват високи стандарти за знания, умения за разсъждаване и креативност, като например създаване на рекламни текстове, писане на романи, научно-популярно писане и генериране на код."
+  },
+  "chatglm3-6b-base": {
+    "description": "ChatGLM3-6b-base е последната генерация на редицата ChatGLM, разработена от компанията Zhipu, с 6 милиарда параметри и е открит източник."
+  },
  "chatgpt-4o-latest": {
    "description": "ChatGPT-4o е динамичен модел, който се актуализира в реално време, за да поддържа най-новата версия. Той комбинира мощно разбиране на езика и генериране на текст, подходящ за мащабни приложения, включително обслужване на клиенти, образование и техническа поддръжка."
  },
@@ -593,12 +602,39 @@
  "cohere-command-r-plus": {
    "description": "Command R+ е модел, оптимизиран за RAG, проектиран да се справя с натоварвания на ниво предприятие."
  },
+  "command": {
+    "description": "Диалогов модел, следващ инструкции, който показва високо качество и надеждност в езиковите задачи, с по-дълга контекстна дължина в сравнение с нашия основен генеративен модел."
+  },
+  "command-a-03-2025": {
+    "description": "Команда A е нашият най-мощен модел до момента, който показва отлични резултати в използването на инструменти, агенти, подобрено генериране на информация (RAG) и многоезични приложения. Команда A разполага с контекстна дължина от 256K и може да работи само с две GPU, а производителността е увеличена с 150% в сравнение с Команда R+ 08-2024."
+  },
+  "command-light": {
+    "description": "По-малка и по-бърза версия на Команда, почти толкова мощна, но с по-бърза скорост."
+  },
+  "command-light-nightly": {
+    "description": "За да съкратим времевия интервал между основните версии, пуснахме нощна версия на модела Команда. За серията command-light, тази версия се нарича command-light-nightly. Обърнете внимание, че command-light-nightly е най-новата, най-експериментална и (възможно) нестабилна версия. Нощните версии се актуализират редовно и без предварително уведомление, затова не се препоръчва използването им в производствени среди."
+  },
+  "command-nightly": {
+    "description": "За да съкратим времевия интервал между основните версии, пуснахме нощна версия на модела Команда. За серията Команда, тази версия се нарича command-cightly. Обърнете внимание, че command-nightly е най-новата, най-експериментална и (възможно) нестабилна версия. Нощните версии се актуализират редовно и без предварително уведомление, затова не се препоръчва използването им в производствени среди."
+  },
  "command-r": {
    "description": "Command R е LLM, оптимизиран за диалогови и дълги контекстуални задачи, особено подходящ за динамично взаимодействие и управление на знания."
  },
+  "command-r-03-2024": {
+    "description": "Команда R е диалогов модел, следващ инструкции, който показва по-високо качество и надеждност в езиковите задачи, с по-дълга контекстна дължина в сравнение с предишните модели. Той може да се използва за сложни работни потоци, като генериране на код, подобрено генериране на информация (RAG), използване на инструменти и агенти."
+  },
+  "command-r-08-2024": {
+    "description": "command-r-08-2024 е актуализирана версия на модела Команда R, пусната през август 2024 г."
+  },
  "command-r-plus": {
    "description": "Command R+ е високопроизводителен голям езиков модел, проектиран за реални бизнес сценарии и сложни приложения."
  },
+  "command-r-plus-04-2024": {
+    "description": "Команда R+ е диалогов модел, следващ инструкции, който показва по-високо качество и надеждност в езиковите задачи, с по-дълга контекстна дължина в сравнение с предишните модели. Той е най-подходящ за сложни RAG работни потоци и многократна употреба на инструменти."
+  },
+  "command-r7b-12-2024": {
+    "description": "command-r7b-12-2024 е малка и ефективна актуализирана версия, пусната през декември 2024 г. Тя показва отлични резултати в задачи, изискващи сложни разсъждения и многократна обработка, като RAG, използване на инструменти и агенти."
+  },
  "dall-e-2": {
    "description": "Второ поколение модел DALL·E, поддържащ по-реалистично и точно генериране на изображения, с резолюция 4 пъти по-висока от първото поколение."
  },
@@ -614,9 +650,6 @@
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": {
    "description": "DeepSeek-R1 дестилиран модел, оптимизира производителността на разсъжденията чрез подсилено учене и данни за студен старт, отворен модел, който обновява многозадачния стандарт."
  },
-  "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
-    "description": "DeepSeek-R1-Distill-Llama-8B е дестилиран модел, базиран на Llama-3.1-8B. Този модел е финализиран с примери, генерирани от DeepSeek-R1, и показва отлична производителност на разсъжденията. Той постига добри резултати в множество бенчмаркове, включително 89.1% точност в MATH-500, 50.4% успеваемост в AIME 2024 и 1205 точки в CodeForces, демонстрирайки силни способности за математика и програмиране."
-  },
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
    "description": "DeepSeek-R1 дестилиран модел, оптимизира производителността на разсъжденията чрез подсилено учене и данни за студен старт, отворен модел, който обновява многозадачния стандарт."
  },
@@ -659,12 +692,30 @@
  "deepseek-r1": {
    "description": "DeepSeek-R1 е модел за извеждане, управляван от подсилено обучение (RL), който решава проблемите с повторяемостта и четимостта в модела. Преди RL, DeepSeek-R1 въвежда данни за студен старт, за да оптимизира допълнително производителността на извеждане. Той показва сравнима производителност с OpenAI-o1 в математически, кодови и извеждащи задачи и подобрява общите резултати чрез внимателно проектирани методи на обучение."
  },
+  "deepseek-r1-70b-fast-online": {
+    "description": "DeepSeek R1 70B бърза версия, поддържаща търсене в реално време, предлагаща по-бърза скорост на отговор, без да компрометира производителността на модела."
+  },
+  "deepseek-r1-70b-online": {
+    "description": "DeepSeek R1 70B стандартна версия, поддържаща търсене в реално време, подходяща за диалози и текстови задачи, изискващи най-новата информация."
+  },
+  "deepseek-r1-distill-llama": {
+    "description": "deepseek-r1-distill-llama е модел, дестилиран от DeepSeek-R1 на базата на Llama."
+  },
  "deepseek-r1-distill-llama-70b": {
    "description": "DeepSeek R1 - по-голям и по-интелигентен модел в комплекта DeepSeek - е дестилиран в архитектурата Llama 70B. На базата на бенчмаркове и човешка оценка, този модел е по-интелигентен от оригиналния Llama 70B, особено в задачи, изискващи математическа и фактическа точност."
  },
  "deepseek-r1-distill-llama-8b": {
    "description": "Моделите от серията DeepSeek-R1-Distill са получени чрез техника на знание дестилация, като се фино настройват образците, генерирани от DeepSeek-R1, спрямо отворени модели като Qwen и Llama."
  },
+  "deepseek-r1-distill-qianfan-llama-70b": {
+    "description": "Първоначално пуснат на 14 февруари 2025 г., дестилиран от екипа за разработка на модела Qianfan с базов модел Llama3_70B (създаден с Meta Llama), в дестилираните данни също е добавен корпус от Qianfan."
+  },
+  "deepseek-r1-distill-qianfan-llama-8b": {
+    "description": "Първоначално пуснат на 14 февруари 2025 г., дестилиран от екипа за разработка на модела Qianfan с базов модел Llama3_8B (създаден с Meta Llama), в дестилираните данни също е добавен корпус от Qianfan."
+  },
+  "deepseek-r1-distill-qwen": {
+    "description": "deepseek-r1-distill-qwen е модел, базиран на Qwen, дестилиран от DeepSeek-R1."
+  },
  "deepseek-r1-distill-qwen-1.5b": {
    "description": "Моделите от серията DeepSeek-R1-Distill са получени чрез техника на знание дестилация, като се фино настройват образците, генерирани от DeepSeek-R1, спрямо отворени модели като Qwen и Llama."
  },
@@ -677,6 +728,12 @@
  "deepseek-r1-distill-qwen-7b": {
    "description": "Моделите от серията DeepSeek-R1-Distill са получени чрез техника на знание дестилация, като се фино настройват образците, генерирани от DeepSeek-R1, спрямо отворени модели като Qwen и Llama."
  },
+  "deepseek-r1-fast-online": {
+    "description": "DeepSeek R1 пълна бърза версия, поддържаща търсене в реално време, комбинираща мощността на 671B параметри с по-бърза скорост на отговор."
+  },
+  "deepseek-r1-online": {
+    "description": "DeepSeek R1 пълна версия, с 671B параметри, поддържаща търсене в реално време, с по-силни способности за разбиране и генериране."
+  },
  "deepseek-reasoner": {
    "description": "Модел за извеждане, разработен от DeepSeek. Преди да предостави окончателния отговор, моделът първо извежда част от веригата на мислене, за да повиши точността на крайния отговор."
  },
@@ -689,6 +746,9 @@
  "deepseek-v3": {
    "description": "DeepSeek-V3 е MoE модел, разработен от Hangzhou DeepSeek AI Technology Research Co., Ltd., с отлични резултати в множество тестове, заемащ първото място в основните класации на отворените модели. V3 постига 3-кратно увеличение на скоростта на генериране в сравнение с V2.5, предоставяйки на потребителите по-бързо и гладко изживяване."
  },
+  "deepseek-v3-0324": {
+    "description": "DeepSeek-V3-0324 е MoE модел с 671B параметри, който се отличава с предимства в програмирането и техническите способности, разбирането на контекста и обработката на дълги текстове."
+  },
  "deepseek/deepseek-chat": {
    "description": "Новооткритият отворен модел, който съчетава общи и кодови способности, не само запазва общата диалогова способност на оригиналния Chat модел и мощната способност за обработка на код на Coder модела, но също така по-добре се съобразява с човешките предпочитания. Освен това, DeepSeek-V2.5 постигна значителни подобрения в задачи по писане, следване на инструкции и много други."
  },
@@ -755,6 +815,9 @@
  "ernie-4.0-turbo-8k-preview": {
    "description": "Флагманският голям езиков модел, разработен от Baidu, с отлични общи резултати, широко приложим в сложни задачи в различни области; поддържа автоматично свързване с плъгина за търсене на Baidu, осигурявайки актуалност на информацията. В сравнение с ERNIE 4.0, показва по-добри резултати."
  },
+  "ernie-4.5-8k-preview": {
+    "description": "Моделът Ernie 4.5 е ново поколение оригинален много модален основен модел, разработен от Baidu, който постига съвместна оптимизация чрез многомодално моделиране, с отлични способности за разбиране на много модалности; предлага усъвършенствани езикови способности, с подобрено разбиране, генериране, логика и памет, значително подобрени способности за избягване на халюцинации, логическо разсъждение и код."
+  },
  "ernie-char-8k": {
    "description": "Специализиран голям езиков модел, разработен от Baidu, подходящ за приложения като NPC в игри, диалози на клиентска поддръжка и ролеви игри, с по-изразителен и последователен стил на персонажите, по-силна способност за следване на инструкции и по-добра производителност на разсъжденията."
  },
@@ -788,9 +851,6 @@
  "gemini-1.0-pro-latest": {
    "description": "Gemini 1.0 Pro е високопроизводителен AI модел на Google, проектиран за разширяване на широк спектър от задачи."
  },
-  "gemini-1.5-flash": {
-    "description": "Gemini 1.5 Flash е най-новият мултимодален AI модел на Google, който предлага бърза обработка и поддържа текстови, изображенчески и видео входове, подходящ за ефективно разширяване на различни задачи."
-  },
  "gemini-1.5-flash-001": {
    "description": "Gemini 1.5 Flash 001 е ефективен многомодален модел, който поддържа разширяване на широк спектър от приложения."
  },
@@ -803,6 +863,9 @@
  "gemini-1.5-flash-8b-exp-0924": {
    "description": "Gemini 1.5 Flash 8B 0924 е най-новият експериментален модел, който показва значителни подобрения в производителността както в текстови, така и в мултимодални приложения."
  },
+  "gemini-1.5-flash-8b-latest": {
+    "description": "Gemini 1.5 Flash 8B е високоефективен мултимодален модел, който поддържа разширени приложения."
+  },
  "gemini-1.5-flash-exp-0827": {
    "description": "Gemini 1.5 Flash 0827 предлага оптимизирани мултимодални способности, подходящи за различни сложни задачи."
  },
@@ -830,24 +893,27 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash предлага следващо поколение функции и подобрения, включително изключителна скорост, нативна употреба на инструменти, многомодално генериране и контекстен прозорец от 1M токена."
  },
+  "gemini-2.0-flash-exp": {
+    "description": "Gemini 2.0 Flash моделна вариация, оптимизирана за икономичност и ниска латентност."
+  },
+  "gemini-2.0-flash-exp-image-generation": {
+    "description": "Gemini 2.0 Flash експериментален модел, който поддържа генериране на изображения"
+  },
  "gemini-2.0-flash-lite": {
    "description": "Gemini 2.0 Flash е вариант на модела, оптимизиран за икономичност и ниска латентност."
  },
  "gemini-2.0-flash-lite-001": {
    "description": "Gemini 2.0 Flash е вариант на модела, оптимизиран за икономичност и ниска латентност."
  },
-  "gemini-2.0-flash-lite-preview-02-05": {
-    "description": "Модел на Gemini 2.0 Flash, оптимизиран за икономичност и ниска латентност."
-  },
-  "gemini-2.0-flash-thinking-exp": {
-    "description": "Gemini 2.0 Flash Exp е най-новият експериментален многомодален AI модел на Google, с ново поколение функции, изключителна скорост, нативно извикване на инструменти и многомодално генериране."
-  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp е най-новият експериментален многомодален AI модел на Google, с ново поколение функции, изключителна скорост, нативно извикване на инструменти и многомодално генериране."
  },
  "gemini-2.0-pro-exp-02-05": {
    "description": "Gemini 2.0 Pro Experimental е най-новият експериментален многомодален AI модел на Google, който предлага значително подобрение в качеството в сравнение с предишните версии, особено по отношение на световни знания, код и дълги контексти."
  },
+  "gemini-2.5-pro-exp-03-25": {
+    "description": "Gemini 2.5 Pro Experimental е най-напредналият модел на мислене на Google, способен да разсъждава по сложни проблеми в код, математика и STEM области, както и да анализира големи набори от данни, кодови библиотеки и документи, използвайки дълъг контекст."
+  },
  "gemma-7b-it": {
    "description": "Gemma 7B е подходяща за обработка на средни и малки задачи, съчетаваща икономичност."
  },
@@ -1016,6 +1082,9 @@
  "gpt-4o-mini-realtime-preview": {
    "description": "Реален вариант на GPT-4o-mini, поддържащ вход и изход на аудио и текст в реално време."
  },
+  "gpt-4o-mini-tts": {
+    "description": "GPT-4o mini TTS е модел за преобразуване на текст в реч, базиран на GPT-4o mini, предлагащ висококачествено генериране на реч при по-ниска цена."
+  },
  "gpt-4o-realtime-preview": {
    "description": "Реален вариант на GPT-4o, поддържащ вход и изход на аудио и текст в реално време."
  },
@@ -1073,6 +1142,12 @@
  "hunyuan-standard-vision": {
    "description": "Най-новият мултимодален модел на Hunyuan, поддържащ отговори на множество езици, с балансирани способности на китайски и английски."
  },
+  "hunyuan-t1-20250321": {
+    "description": "Цялостно изграждане на моделни способности в хуманитарни и точни науки, с висока способност за улавяне на дълги текстови информации. Поддържа разсъждения и отговори на научни въпроси от всякаква трудност, включително математика, логика, наука и код."
+  },
+  "hunyuan-t1-latest": {
+    "description": "Първият в индустрията свръхголям хибриден трансформаторен модел за инференция, който разширява инференционните способности, предлага изключителна скорост на декодиране и допълнително съгласува човешките предпочитания."
+  },
  "hunyuan-translation": {
    "description": "Поддържа автоматичен превод между 15 езика, включително китайски, английски, японски, френски, португалски, испански, турски, руски, арабски, корейски, италиански, немски, виетнамски, малайски и индонезийски, базиран на автоматизирана оценка COMET, с цялостна преводна способност, която е по-добра от моделите на пазара с подобен мащаб."
  },
@@ -1082,9 +1157,6 @@
  "hunyuan-turbo": {
    "description": "Предварителна версия на новото поколение голям езиков модел на HunYuan, използваща нова структура на смесен експертен модел (MoE), с по-бърза скорост на извеждане и по-силни резултати в сравнение с hunyuan-pro."
  },
-  "hunyuan-turbo-20241120": {
-    "description": "Фиксирана версия на hunyuan-turbo от 20 ноември 2024 г., която е между hunyuan-turbo и hunyuan-turbo-latest."
-  },
  "hunyuan-turbo-20241223": {
    "description": "Оптимизация в тази версия: скалиране на данни и инструкции, значително повишаване на общата генерализационна способност на модела; значително повишаване на математическите, кодовите и логическите способности; оптимизиране на свързаните с разбирането на текста и думите способности; оптимизиране на качеството на генерираното съдържание при създаване на текст."
  },
@@ -1094,6 +1166,15 @@
  "hunyuan-turbo-vision": {
    "description": "Новото поколение визуално езиково флагманско голямо модел на Hunyuan, използващо нова структура на смесен експертен модел (MoE), с цялостно подобрение на способностите за основно разпознаване, създаване на съдържание, отговори на въпроси и анализ и разсъждение в сравнение с предишното поколение модели."
  },
+  "hunyuan-turbos-20250226": {
+    "description": "hunyuan-TurboS pv2.1.2 фиксирана версия, предтренировъчна база с увеличен брой токени; подобрени способности за разсъждение в математика/логика/код и др.; подобрено изживяване на китайски и английски, включително текстово творчество, разбиране на текст, въпроси и отговори, разговори и др."
+  },
+  "hunyuan-turbos-20250313": {
+    "description": "Уеднаквяване на стила на математическите решения, засилване на многократните въпроси и отговори по математика. Оптимизация на стила на отговорите в текстовото творчество, премахване на AI привкус и добавяне на литературност."
+  },
+  "hunyuan-turbos-latest": {
+    "description": "hunyuan-TurboS е последната версия на флагманския модел Hunyuan, с по-силни способности за разсъждение и по-добро потребителско изживяване."
+  },
  "hunyuan-vision": {
    "description": "Най-новият мултимодален модел на HunYuan, поддържащ генериране на текстово съдържание от изображения и текстови входове."
  },
@@ -1124,12 +1205,18 @@
  "lite": {
    "description": "Spark Lite е лек модел на голям език, с изключително ниска латентност и ефективна обработка, напълно безплатен и отворен, поддържащ функции за онлайн търсене в реално време. Неговите бързи отговори го правят отличен за приложения на нискомощни устройства и фина настройка на модели, предоставяйки на потребителите отлична рентабилност и интелигентно изживяване, особено в контекста на въпроси и отговори, генериране на съдържание и търсене."
  },
+  "llama-2-7b-chat": {
+    "description": "Llama2 е серия от големи модели за език (LLM), разработени и с отворен код от Meta. Това е набор от генеративни текстови модели с различен размер, от 7 милиарда до 70 милиарда параметри, които са претренирани и майсторски оптимизирани. Архитектурно, Llama2 е автоматично регресивен езиков модел, използващ оптимизирана трансформаторна архитектура. Подобренията включват супервизирано майсторско трениране (SFT) и подкрепено с учене с награди (RLHF) за подреждане на предпочтенията на хората за полезност и безопасност. Llama2 демонстрира значително подобрени резултати върху множество академични набори от данни, което предоставя възможности за дизайн и развитие на много други модели."
+  },
  "llama-3.1-70b-versatile": {
    "description": "Llama 3.1 70B предлага по-мощни способности за разсъждение на AI, подходящи за сложни приложения, поддържащи множество изчислителни обработки и осигуряващи ефективност и точност."
  },
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B е модел с висока производителност, предлагащ бързи способности за генериране на текст, особено подходящ за приложения, изискващи мащабна ефективност и икономичност."
  },
+  "llama-3.1-instruct": {
+    "description": "Моделата Llama 3.1 с фина настройка за инструкции е оптимизирана за диалогови сценарии и надминава много съществуващи модели с отворен код в общи отраслови бенчмарк тестове."
+  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Изключителни способности за визуално разсъждение върху изображения с висока разделителна способност, подходящи за приложения за визуално разбиране."
  },
@@ -1142,12 +1229,18 @@
  "llama-3.2-90b-vision-preview": {
    "description": "Llama 3.2 е проектиран да обработва задачи, свързващи визуални и текстови данни. Той показва отлични резултати в задачи като описание на изображения и визуални въпроси и отговори, преодолявайки пропастта между генерирането на език и визуалното разсъждение."
  },
+  "llama-3.2-vision-instruct": {
+    "description": "Моделът Llama 3.2-Vision с инструкции е оптимизиран за визуално разпознаване, изводи от изображения, описание на изображения и отговаряне на общи въпроси, свързани с изображения."
+  },
  "llama-3.3-70b-instruct": {
    "description": "Llama 3.3 е най-напредналият многоезичен отворен езиков модел от серията Llama, който предлага производителност, сравнима с 405B моделите, на изключително ниска цена. Базиран на структурата Transformer и подобрен чрез супервизирано фино настройване (SFT) и обучение с човешка обратна връзка (RLHF) за повишаване на полезността и безопасността. Неговата версия, оптимизирана за инструкции, е специално проектирана за многоезични диалози и показва по-добри резултати от много от отворените и затворените чат модели в множество индустриални бенчмаркове. Краен срок за знания: декември 2023."
  },
  "llama-3.3-70b-versatile": {
    "description": "Meta Llama 3.3 е многоезичен модел за генерация на език (LLM) с 70B (вход/изход на текст), който е предварително обучен и е пригоден за указания. Чистият текстов модел на Llama 3.3 е оптимизиран за многоезични диалогови случаи и надминава много налични отворени и затворени чат модели на стандартни индустриални тестове."
  },
+  "llama-3.3-instruct": {
+    "description": "Моделата Llama 3.3 с фина настройка за инструкции е оптимизирана за диалогови сценарии и надминава много съществуващи модели с отворен код в общи отраслови бенчмарк тестове."
+  },
  "llama3-70b-8192": {
    "description": "Meta Llama 3 70B предлага ненадмината способност за обработка на сложност, проектирана за високи изисквания."
  },
@@ -1187,6 +1280,9 @@
  "max-32k": {
    "description": "Spark Max 32K е конфигуриран с голяма способност за обработка на контекст, с по-силно разбиране на контекста и логическо разсъждение, поддържащ текстови входове до 32K токена, подходящ за четене на дълги документи, частни въпроси и отговори и други сценарии."
  },
+  "megrez-3b-instruct": {
+    "description": "Megrez-3B-Instruct е голям езиков модел, напълно обучен от безкрайната връху чиповете. Megrez-3B-Instruct се стреми чрез концепцията за съвместно хардуерно-софтуерно взаимодействие да създаде решение за крайните устройства, което е бързо за извършване, компактно и лесно за използване."
+  },
  "meta-llama-3-70b-instruct": {
    "description": "Мощен модел с 70 милиарда параметри, отличаващ се в разсъждения, кодиране и широки езикови приложения."
  },
@@ -1223,9 +1319,6 @@
  "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": {
    "description": "LLaMA 3.2 е проектирана да обработва задачи, комбиниращи визуални и текстови данни. Тя демонстрира отлични резултати в задачи като описание на изображения и визуални въпроси и отговори, преодолявайки пропастта между генерирането на езици и визуалното разсъждение."
  },
-  "meta-llama/Llama-3.3-70B-Instruct": {
-    "description": "Llama 3.3 е най-напредналият многоезичен отворен голям езиков модел от серията Llama, предлагащ производителност, сравнима с 405B моделите на изключително ниска цена. Базиран на структурата Transformer и подобрен чрез супервизирано фино настройване (SFT) и обучение с човешка обратна връзка (RLHF) за повишаване на полезността и безопасността. Неговата версия за оптимизация на инструкции е специално проектирана за многоезични диалози и показва по-добри резултати от много от отворените и затворените чат модели в множество индустриални бенчмаркове. Краен срок за знания: декември 2023 г."
-  },
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
    "description": "Meta Llama 3.3 многоезичен голям езиков модел (LLM) е предварително обучен и коригиран за инструкции в 70B (текстов вход/текстов изход). Моделът Llama 3.3, коригиран за инструкции, е оптимизиран за многоезични диалогови случаи и превъзхожда много налични отворени и затворени чат модели на общи индустриални бенчмаркове."
  },
@@ -1253,15 +1346,9 @@
  "meta-llama/Meta-Llama-3.1-70B": {
    "description": "Llama 3.1 е водещ модел, представен от Meta, поддържащ до 405B параметри, подходящ за сложни разговори, многоезичен превод и анализ на данни."
  },
-  "meta-llama/Meta-Llama-3.1-70B-Instruct": {
-    "description": "LLaMA 3.1 70B предлага ефективна поддръжка за многоезични диалози."
-  },
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
    "description": "Llama 3.1 70B моделът е прецизно настроен за приложения с високо натоварване, квантован до FP8, осигурявайки по-ефективна изчислителна мощ и точност, гарантиращи изключителна производителност в сложни сценарии."
  },
-  "meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "LLaMA 3.1 предлага многоезична поддръжка и е един от водещите генеративни модели в индустрията."
-  },
  "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
    "description": "Llama 3.1 8B моделът използва FP8 квантоване, поддържа до 131,072 контекстови маркера и е сред най-добрите отворени модели, подходящи за сложни задачи, с производителност, превъзхождаща много индустриални стандарти."
  },
@@ -1355,12 +1442,18 @@
  "mistral-large": {
    "description": "Mixtral Large е флагманският модел на Mistral, комбиниращ способности за генериране на код, математика и разсъждение, поддържащ контекстен прозорец от 128k."
  },
+  "mistral-large-instruct": {
+    "description": "Mistral-Large-Instruct-2407 е усъвършенстван плътен голям езиков модел (LLM) с 123 милиарда параметъра, който притежава водещи във времето си способности за разсъждение, познания и кодиране."
+  },
  "mistral-large-latest": {
    "description": "Mistral Large е флагманският модел, специализиран в многоезични задачи, сложни разсъждения и генериране на код, идеален за висококачествени приложения."
  },
  "mistral-nemo": {
    "description": "Mistral Nemo е 12B модел, разработен в сътрудничество между Mistral AI и NVIDIA, предлагащ ефективна производителност."
  },
+  "mistral-nemo-instruct": {
+    "description": "Mistral-Nemo-Instruct-2407 е голям езиков модел (LLM), който представлява фино настроена за инструкции версия на Mistral-Nemo-Base-2407."
+  },
  "mistral-small": {
    "description": "Mistral Small може да се използва за всяка езикова задача, която изисква висока ефективност и ниска латентност."
  },
@@ -1577,6 +1670,12 @@
  "qwen2": {
    "description": "Qwen2 е новото поколение голям езиков модел на Alibaba, предлагащ отлична производителност за разнообразни приложения."
  },
+  "qwen2-72b-instruct": {
+    "description": "Qwen2 е новият серий на големи модели за език, предложен от екипа Qwen. Той се основава на архитектурата Transformer и използва SwiGLU активационна функция, внимание QKV смещение (attention QKV bias), групово запитване на внимание (group query attention), смесени техники за внимание с превъртващи се прозорци (mixture of sliding window attention) и пълно внимание. Освен това, екипът Qwen също е подобрал токенизатора, който поддържа множество езици и код."
+  },
+  "qwen2-7b-instruct": {
+    "description": "Qwen2 е новият серийен модел за големи езици, представен от екипа Qwen. Той се основава на архитектурата Transformer и използва SwiGLU активационна функция, внимание с QKV смещение (attention QKV bias), групово внимание за заявки (group query attention), смесени техники за обръщане на внимание с превъртващи се прозорци (mixture of sliding window attention) и пълно внимание. Освен това, екипът Qwen е подобрил токенизатора, който поддържа множество езици и код."
+  },
  "qwen2.5": {
    "description": "Qwen2.5 е новото поколение мащабен езиков модел на Alibaba, който предлага отлична производителност, за да отговори на разнообразни приложни нужди."
  },
@@ -1604,6 +1703,12 @@
  "qwen2.5-coder-7b-instruct": {
    "description": "Отворената версия на модела на кода Qwen."
  },
+  "qwen2.5-coder-instruct": {
+    "description": "Qwen2.5-Coder е най-новият специализиран голям езиков модел за код от серията Qwen (предишно име CodeQwen)."
+  },
+  "qwen2.5-instruct": {
+    "description": "Qwen2.5 е най-новата серия от големи езикови модели на Qwen. За Qwen2.5 публикувахме няколко основни езикови модели и модели с фино настройване на инструкции, с параметри в диапазона от 500 милиона до 7,2 милиарда."
+  },
  "qwen2.5-math-1.5b-instruct": {
    "description": "Qwen-Math моделът разполага със силни умения за решаване на математически задачи."
  },
@@ -1613,12 +1718,21 @@
  "qwen2.5-math-7b-instruct": {
    "description": "Моделът Qwen-Math притежава силни способности за решаване на математически задачи."
  },
+  "qwen2.5-omni-7b": {
+    "description": "Моделите от серията Qwen-Omni поддържат входни данни от множество модалности, включително видео, аудио, изображения и текст, и изходят аудио и текст."
+  },
+  "qwen2.5-vl-32b-instruct": {
+    "description": "Моделите от серията Qwen2.5-VL подобряват интелигентността, практичността и приложимостта на модела, като ги правят по-ефективни в сценарии като естествени разговори, създаване на съдържание, професионални услуги и разработка на код. Версията 32B използва технологии за обучение с подсилване за оптимизиране на модела, предлагайки в сравнение с другите модели от серията Qwen2.5 VL по-съответстващ на човешките предпочитания стил на изход, способност за разсъждение върху сложни математически проблеми, както и фино разбиране и разсъждение на изображения."
+  },
  "qwen2.5-vl-72b-instruct": {
    "description": "Подобрение на следването на инструкции, математика, решаване на проблеми и код, повишаване на способността за разпознаване на обекти, поддържа директно точно локализиране на визуални елементи в различни формати, поддържа разбиране на дълги видео файлове (до 10 минути) и локализиране на събития в секунда, може да разбира времеви последователности и скорости, базирано на способности за анализ и локализация, поддържа управление на OS или Mobile агенти, силна способност за извличане на ключова информация и изход в JSON формат, тази версия е 72B, най-силната версия в серията."
  },
  "qwen2.5-vl-7b-instruct": {
    "description": "Подобрение на следването на инструкции, математика, решаване на проблеми и код, повишаване на способността за разпознаване на обекти, поддържа директно точно локализиране на визуални елементи в различни формати, поддържа разбиране на дълги видео файлове (до 10 минути) и локализиране на събития в секунда, може да разбира времеви последователности и скорости, базирано на способности за анализ и локализация, поддържа управление на OS или Mobile агенти, силна способност за извличане на ключова информация и изход в JSON формат, тази версия е 72B, най-силната версия в серията."
  },
+  "qwen2.5-vl-instruct": {
+    "description": "Qwen2.5-VL е най-новата версия на визуално-езиковия модел от семейството Qwen."
+  },
  "qwen2.5:0.5b": {
    "description": "Qwen2.5 е новото поколение мащабен езиков модел на Alibaba, който предлага отлична производителност, за да отговори на разнообразни приложни нужди."
  },
@@ -1754,6 +1868,9 @@
  "wizardlm2:8x22b": {
    "description": "WizardLM 2 е езиков модел, предоставен от Microsoft AI, който се отличава в сложни диалози, многоезичност, разсъждение и интелигентни асистенти."
  },
+  "yi-1.5-34b-chat": {
+    "description": "Yi-1.5 е обновена версия на Yi. Тя използва висококачествен корпус от 500B токена за продължителна предварителна обучение на Yi и е майсторски подобрявана с 3M разнообразни примера за fino-tuning."
+  },
  "yi-large": {
    "description": "Новият модел с хиляда милиарда параметри предлага изключителни способности за отговори и генериране на текст."
  },
@@ -23,6 +23,9 @@
  "cloudflare": {
    "description": "Работа с модели на машинно обучение, задвижвани от безсървърни GPU, в глобалната мрежа на Cloudflare."
  },
+  "cohere": {
+    "description": "Cohere ви предлага най-съвременни многоезични модели, напреднали функции за търсене и AI работно пространство, проектирано специално за съвременните предприятия — всичко интегрирано в една сигурна платформа."
+  },
  "deepseek": {
    "description": "DeepSeek е компания, специализирана в изследвания и приложения на технологии за изкуствен интелект, чийто най-нов модел DeepSeek-V2.5 комбинира способности за общи диалози и обработка на код, постигайки значителни подобрения в съответствието с човешките предпочитания, писателските задачи и следването на инструкции."
  },
@@ -53,6 +56,9 @@
  "hunyuan": {
    "description": "Модел на голям език, разработен от Tencent, който притежава мощни способности за създаване на текст на китайски, логическо разсъждение в сложни контексти и надеждни способности за изпълнение на задачи."
  },
+  "infiniai": {
+    "description": "Предоставя високопроизводителни, лесни за използване и сигурни услуги с големи модели за приложението разработчици, покриващи целия процес от разработка на големи модели до техното услугово разгъване."
+  },
  "internlm": {
    "description": "Отворена организация, посветена на изследването и разработването на инструменти за големи модели. Предоставя на всички AI разработчици ефективна и лесна за използване отворена платформа, която прави най-съвременните технологии и алгоритми за големи модели достъпни."
  },
@@ -98,6 +104,9 @@
  "sambanova": {
    "description": "SambaNova Cloud позволява на разработчиците лесно да използват най-добрите отворени модели и да се наслаждават на най-бързата скорост на извеждане."
  },
+  "search1api": {
+    "description": "Search1API предоставя достъп до серията модели DeepSeek, които могат да се свързват в мрежа при нужда, включително стандартна и бърза версия, с поддръжка за избор на модели с различни параметри."
+  },
  "sensenova": {
    "description": "SenseNova, с мощната основа на SenseTime, предлага ефективни и лесни за използване услуги за големи модели с пълен стек."
  },
@@ -137,6 +146,9 @@
  "xai": {
    "description": "xAI е компания, която се стреми да изгражда изкуствен интелект за ускоряване на човешките научни открития. Нашата мисия е да насърчаваме общото ни разбиране за вселената."
  },
+  "xinference": {
+    "description": "Xorbits Inference (Xinference) е платформа с отворен код, предназначена да опрости изпълнението и интегрирането на различни AI модели. С Xinference можете да използвате всякакви LLM с отворен код, модели за вграждане и мултимодални модели за извършване на изводи в облак или локална среда, както и да създавате мощни AI приложения."
+  },
  "zeroone": {
    "description": "01.AI се фокусира върху технологии за изкуствен интелект от ерата на AI 2.0, активно насърчавайки иновации и приложения на \"човек + изкуствен интелект\", използвайки мощни модели и напреднали AI технологии за повишаване на производителността на човека и реализиране на технологично овластяване."
  },
@@ -42,6 +42,17 @@
    "sessionWithName": "Настройки на сесията · {{name}}",
    "title": "Настройки"
  },
+  "hotkey": {
+    "conflicts": "Конфликт с текущите клавишни комбинации",
+    "group": {
+      "conversation": "Разговор",
+      "essential": "Основен"
+    },
+    "invalidCombination": "Клавишната комбинация трябва да съдържа поне един модификатор (Ctrl, Alt, Shift) и един обикновен клавиш",
+    "record": "Натиснете клавиш, за да запишете клавишна комбинация",
+    "reset": "Нулиране до подразбиращите се клавишни комбинации",
+    "title": "Бързи клавиши"
+  },
  "llm": {
    "aesGcm": "Вашият ключ и адрес на агента ще бъдат криптирани с алгоритъма за криптиране <1>AES-GCM</1>",
    "apiKey": {
@@ -335,6 +346,33 @@
    },
    "title": "Настройки на темата"
  },
+  "storage": {
+    "actions": {
+      "export": {
+        "button": "Експортиране",
+        "exportType": {
+          "agent": "Експортиране на настройки на асистента",
+          "agentWithMessage": "Експортиране на асистента и съобщенията",
+          "all": "Експортиране на глобалните настройки и всички данни на асистентите",
+          "allAgent": "Експортиране на всички настройки на асистентите",
+          "allAgentWithMessage": "Експортиране на всички асистенти и съобщения",
+          "globalSetting": "Експортиране на глобалните настройки"
+        },
+        "title": "Експортиране на данни"
+      },
+      "import": {
+        "button": "Импортиране",
+        "title": "Импортиране на данни"
+      },
+      "title": "Разширени операции"
+    },
+    "desc": "Използване на хранилището в текущия браузър",
+    "embeddings": {
+      "used": "Векторно хранилище"
+    },
+    "title": "Данни за хранилище",
+    "used": "Използване на хранилището"
+  },
  "submitAgentModal": {
    "button": "Изпрати агент",
    "identifier": "Идентификатор на агент",
@@ -425,8 +463,10 @@
    "agent": "Агент по подразбиране",
    "common": "Общи настройки",
    "experiment": "Експеримент",
+    "hotkey": "Бързи клавиши",
    "llm": "Езиков модел",
    "provider": "AI доставчик",
+    "storage": "Данни за хранилище",
    "sync": "Синхронизиране в облака",
    "system-agent": "Системен асистент",
    "tts": "Текст към реч"
@@ -32,6 +32,7 @@
    "title": "Списък с теми"
  },
  "searchPlaceholder": "Търсене на теми...",
+  "searchResultEmpty": "Няма намерени резултати",
  "temp": "Временен",
  "title": "Тема"
 }
@@ -64,6 +64,9 @@
    "stop": "Stoppen",
    "warp": "Zeilenumbruch"
  },
+  "intentUnderstanding": {
+    "title": "Verstehe und analysiere gerade Ihre Absicht..."
+  },
  "knowledgeBase": {
    "all": "Alle Inhalte",
    "allFiles": "Alle Dateien",
@@ -144,7 +147,6 @@
        "desc": "Intelligente Beurteilung, ob eine Suche basierend auf dem Gesprächsinhalt erforderlich ist",
        "title": "Intelligente Vernetzung"
      },
-      "disable": "Das aktuelle Modell unterstützt keine Funktionsaufrufe, daher kann die intelligente Vernetzungsfunktion nicht verwendet werden",
      "off": {
        "desc": "Verwendet nur das Grundwissen des Modells, ohne Netzsuche",
        "title": "Vernetzung deaktivieren"
@@ -155,6 +157,10 @@
      },
      "useModelBuiltin": "Verwenden Sie die integrierte Suchmaschine des Modells"
    },
+    "searchModel": {
+      "desc": "Das aktuelle Modell unterstützt keine Funktionsaufrufe, daher muss es mit einem Modell kombiniert werden, das Funktionsaufrufe unterstützt, um online zu suchen",
+      "title": "Suchunterstützungsmodell"
+    },
    "title": "Netzwerksuche"
  },
  "searchAgentPlaceholder": "Suchassistent...",
@@ -41,7 +41,10 @@
    "error": {
      "desc": "Es tut uns leid, während des Initialisierungsprozesses der Pglite-Datenbank ist ein Fehler aufgetreten. Bitte klicken Sie auf die Schaltfläche, um es erneut zu versuchen. Wenn der Fehler nach mehreren Versuchen weiterhin auftritt, <1>reichen Sie bitte ein Problem ein</1>, und wir werden Ihnen umgehend bei der Untersuchung helfen.",
      "detail": "Fehlerursache: [{{type}}] {{message}}. Einzelheiten sind wie folgt:",
+      "detailTitle": "Fehlerursache",
+      "report": "Problem melden",
      "retry": "Erneut versuchen",
+      "selfSolve": "Selbsthilfe",
      "title": "Datenbankinitialisierung fehlgeschlagen"
    },
    "initing": {
@@ -80,6 +83,54 @@
      "button": "Jetzt verwenden",
      "desc": "Jetzt verwenden",
      "title": "PGlite-Datenbank ist bereit"
+    },
+    "solve": {
+      "backup": {
+        "backup": "Sicherung",
+        "backupSuccess": "Sicherung erfolgreich",
+        "desc": "Wichtige Daten aus der aktuellen Datenbank exportieren",
+        "export": "Alle Daten exportieren",
+        "exportDesc": "Die exportierten Daten werden im JSON-Format gespeichert und können für eine spätere Wiederherstellung oder Analyse verwendet werden.",
+        "reset": {
+          "alert": "Warnung",
+          "alertDesc": "Die folgenden Aktionen können zu Datenverlust führen. Bitte stellen Sie sicher, dass Sie wichtige Daten gesichert haben, bevor Sie fortfahren.",
+          "button": "Datenbank vollständig zurücksetzen (alle Daten löschen)",
+          "confirm": {
+            "desc": "Diese Aktion wird alle Daten löschen und ist nicht rückgängig zu machen. Möchten Sie fortfahren?",
+            "title": "Datenbank zurücksetzen bestätigen"
+          },
+          "desc": "Datenbank zurücksetzen, wenn eine Wiederherstellung nicht möglich ist",
+          "title": "Datenbank zurücksetzen"
+        },
+        "restore": "Wiederherstellen",
+        "restoreSuccess": "Wiederherstellung erfolgreich",
+        "title": "Datenbackup"
+      },
+      "diagnosis": {
+        "createdAt": "Erstellungszeit",
+        "migratedAt": "Migration abgeschlossen",
+        "sql": "Migration SQL",
+        "title": "Migrationsstatus"
+      },
+      "repair": {
+        "desc": "Manuelle Verwaltung des Migrationsstatus",
+        "runSQL": "Benutzerdefinierte Ausführung",
+        "sql": {
+          "clear": "Leeren",
+          "desc": "Benutzerdefinierte SQL-Anweisungen ausführen, um Datenbankprobleme zu beheben",
+          "markFinished": "Als abgeschlossen markieren",
+          "placeholder": "SQL-Anweisung eingeben...",
+          "result": "Ausführungsergebnis",
+          "run": "Ausführen",
+          "title": "SQL-Ausführungswerkzeug"
+        },
+        "title": "Migrationskontrolle"
+      },
+      "tabs": {
+        "backup": "Backup und Wiederherstellung",
+        "diagnosis": "Diagnose",
+        "repair": "Reparatur"
+      }
    }
  },
  "close": "Schließen",
@@ -132,7 +183,7 @@
  },
  "fullscreen": "Vollbildmodus",
  "historyRange": "Verlaufsbereich",
-  "import": "Importieren",
+  "importData": "Daten importieren",
  "importModal": {
    "error": {
      "desc": "Es tut uns sehr leid, aber beim Importieren der Daten ist ein Fehler aufgetreten. Bitte versuchen Sie es erneut oder <1>senden Sie uns eine Anfrage</1>, damit wir das Problem umgehend für Sie lösen können.",
@@ -154,7 +205,8 @@
      "sessions": "Assistenten",
      "skips": "Übersprungen (doppelt)",
      "topics": "Themen",
-      "type": "Datentyp"
+      "type": "Datentyp",
+      "update": "Datensatz aktualisiert"
    },
    "title": "Daten importieren",
    "uploading": {
@@ -163,6 +215,16 @@
      "speed": "Upload-Geschwindigkeit"
    }
  },
+  "importPreview": {
+    "confirmImport": "Import bestätigen",
+    "tables": {
+      "count": "Anzahl der Datensätze",
+      "name": "Tabellenname"
+    },
+    "title": "Datenimportvorschau",
+    "totalRecords": "Insgesamt werden {{count}} Datensätze importiert",
+    "totalTables": "{{count}} Tabellen"
+  },
  "information": "Community und Informationen",
  "installPWA": "Installiere die Browser-App",
  "lang": {
@@ -76,6 +76,7 @@
      "custom": "Benutzerdefiniertes Modell, standardmäßig unterstützt es sowohl Funktionsaufrufe als auch visuelle Erkennung. Bitte überprüfen Sie die Verfügbarkeit dieser Fähigkeiten basierend auf den tatsächlichen Gegebenheiten.",
      "file": "Dieses Modell unterstützt das Hochladen von Dateien und deren Erkennung.",
      "functionCall": "Dieses Modell unterstützt Funktionsaufrufe.",
+      "imageOutput": "Dieses Modell unterstützt die Generierung von Bildern",
      "reasoning": "Dieses Modell unterstützt tiefes Denken",
      "search": "Dieses Modell unterstützt die Online-Suche",
      "tokens": "Dieses Modell unterstützt maximal {{tokens}} Tokens pro Sitzung.",
@@ -85,6 +86,8 @@
  },
  "ModelSwitchPanel": {
    "emptyModel": "Kein aktiviertes Modell. Bitte gehen Sie zu den Einstellungen, um es zu aktivieren.",
+    "emptyProvider": "Es sind keine aktiven Anbieter vorhanden, bitte gehen Sie zu den Einstellungen, um sie zu aktivieren",
+    "goToSettings": "Zu den Einstellungen gehen",
    "provider": "Anbieter"
  },
  "OllamaSetupGuide": {
@@ -16,6 +16,16 @@
    "detail": "Fehlerdetails",
    "title": "Anfrage fehlgeschlagen"
  },
+  "import": {
+    "importConfigFile": {
+      "description": "Fehlerursache: {{reason}}",
+      "title": "Import fehlgeschlagen"
+    },
+    "incompatible": {
+      "description": "Diese Datei wurde aus einer höheren Version exportiert. Bitte versuchen Sie, auf die neueste Version zu aktualisieren und dann erneut zu importieren.",
+      "title": "Die aktuelle Anwendung unterstützt den Import dieser Datei nicht"
+    }
+  },
  "loginRequired": {
    "desc": "Sie werden in Kürze zur Anmeldeseite weitergeleitet",
    "title": "Bitte melden Sie sich an, um diese Funktion zu nutzen"
@@ -69,6 +79,7 @@
    "524": "Es tut uns leid, der Server hat beim Warten auf eine Antwort die Zeit überschritten, möglicherweise aufgrund einer zu langsamen Antwort. Bitte versuchen Sie es später erneut.",
    "AgentRuntimeError": "Es ist ein Fehler bei der Ausführung des Lobe-Sprachmodells aufgetreten. Bitte überprüfen Sie die folgenden Informationen oder versuchen Sie es erneut.",
    "ConnectionCheckFailed": "Die Anfrage brachte eine leere Antwort zurück. Bitte überprüfen Sie, ob die API-Proxy-Adresse am Ende nicht mit `/v1` endet.",
+    "CreateMessageError": "Es tut uns leid, die Nachricht konnte nicht erfolgreich gesendet werden. Bitte kopieren Sie den Inhalt und senden Sie ihn erneut. Nach dem Aktualisieren der Seite wird diese Nachricht nicht gespeichert.",
    "ExceededContextWindow": "Der aktuelle Anfrageinhalt überschreitet die von dem Modell verarbeitbare Länge. Bitte reduzieren Sie die Menge des Inhalts und versuchen Sie es erneut.",
    "FreePlanLimit": "Sie sind derzeit ein kostenloser Benutzer und können diese Funktion nicht nutzen. Bitte aktualisieren Sie auf ein kostenpflichtiges Abonnement, um fortzufahren.",
    "InsufficientQuota": "Es tut uns leid, das Kontingent (Quota) für diesen Schlüssel ist erreicht. Bitte überprüfen Sie Ihr Kontoguthaben oder erhöhen Sie das Kontingent des Schlüssels und versuchen Sie es erneut.",
@@ -0,0 +1,46 @@
+{
+  "addUserMessage": {
+    "desc": "Fügen Sie den aktuellen Eingabetext als Benutzernachricht hinzu, ohne die Generierung auszulösen",
+    "title": "Benutzernachricht hinzufügen"
+  },
+  "editMessage": {
+    "desc": "Treten Sie in den Bearbeitungsmodus, indem Sie die Alt-Taste gedrückt halten und auf die Nachricht doppelklicken",
+    "title": "Nachricht bearbeiten"
+  },
+  "openChatSettings": {
+    "desc": "Aktuelle Sitzungseinstellungen anzeigen und ändern",
+    "title": "Chat-Einstellungen öffnen"
+  },
+  "openHotkeyHelper": {
+    "desc": "Anleitung zur Verwendung aller Tastenkombinationen anzeigen",
+    "title": "Tastenkombinationshilfe öffnen"
+  },
+  "regenerateMessage": {
+    "desc": "Die letzte Nachricht neu generieren",
+    "title": "Nachricht neu generieren"
+  },
+  "saveTopic": {
+    "desc": "Das aktuelle Thema speichern und ein neues Thema öffnen",
+    "title": "Neues Thema beginnen"
+  },
+  "search": {
+    "desc": "Hauptsuchfeld der aktuellen Seite aufrufen",
+    "title": "Suche"
+  },
+  "switchAgent": {
+    "desc": "Wechseln Sie zwischen den im Seitenbereich fixierten Assistenten, indem Sie die Strg-Taste gedrückt halten und eine Zahl von 0 bis 9 drücken",
+    "title": "Schnell zwischen Assistenten wechseln"
+  },
+  "toggleLeftPanel": {
+    "desc": "Linkes Hilfepanel ein- oder ausblenden",
+    "title": "Assistentenpanel ein-/ausblenden"
+  },
+  "toggleRightPanel": {
+    "desc": "Rechtes Themenpanel ein- oder ausblenden",
+    "title": "Themenpanel ein-/ausblenden"
+  },
+  "toggleZenMode": {
+    "desc": "Im Fokusmodus nur die aktuelle Sitzung anzeigen, andere UI ausblenden",
+    "title": "Fokussierungsmodus umschalten"
+  }
+}
@@ -1,13 +1,4 @@
 {
-  "01-ai/Yi-1.5-34B-Chat-16K": {
-    "description": "Yi-1.5 34B bietet mit umfangreichen Trainingsbeispielen überlegene Leistungen in der Branchenanwendung."
-  },
-  "01-ai/Yi-1.5-6B-Chat": {
-    "description": "Yi-1.5-6B-Chat ist eine Variante der Yi-1.5-Serie und gehört zu den Open-Source-Chatmodellen. Yi-1.5 ist die verbesserte Version von Yi, die auf 500B hochwertigen Korpora kontinuierlich vortrainiert wurde und auf 3M diversifizierten Feinabstimmungsbeispielen feinabgestimmt wurde. Im Vergleich zu Yi zeigt Yi-1.5 stärkere Fähigkeiten in Codierung, Mathematik, Inferenz und Befolgung von Anweisungen, während es hervorragende Sprachverständnis-, Alltagswissen- und Leseverständnisfähigkeiten bewahrt. Das Modell bietet Versionen mit Kontextlängen von 4K, 16K und 32K, mit einer Gesamtanzahl von 3,6T Tokens im Vortraining."
-  },
-  "01-ai/Yi-1.5-9B-Chat-16K": {
-    "description": "Yi-1.5 9B unterstützt 16K Tokens und bietet effiziente, flüssige Sprachgenerierungsfähigkeiten."
-  },
  "01-ai/yi-1.5-34b-chat": {
    "description": "Yi 1.5, das neueste Open-Source-Fine-Tuning-Modell mit 34 Milliarden Parametern, unterstützt verschiedene Dialogszenarien mit hochwertigen Trainingsdaten, die auf menschliche Präferenzen abgestimmt sind."
  },
@@ -149,12 +140,6 @@
  "Llama-3.2-90B-Vision-Instruct\t": {
    "description": "Fortgeschrittene Bildschlussfolgerungsfähigkeiten für Anwendungen im Bereich der visuellen Verständigung."
  },
-  "LoRA/Qwen/Qwen2.5-72B-Instruct": {
-    "description": "Qwen2.5-72B-Instruct ist eines der neuesten großen Sprachmodelle, die von Alibaba Cloud veröffentlicht wurden. Dieses 72B-Modell hat signifikante Verbesserungen in den Bereichen Codierung und Mathematik. Das Modell bietet auch mehrsprachige Unterstützung und deckt über 29 Sprachen ab, einschließlich Chinesisch und Englisch. Es zeigt signifikante Verbesserungen in der Befolgung von Anweisungen, im Verständnis strukturierter Daten und in der Generierung strukturierter Ausgaben (insbesondere JSON)."
-  },
-  "LoRA/Qwen/Qwen2.5-7B-Instruct": {
-    "description": "Qwen2.5-7B-Instruct ist eines der neuesten großen Sprachmodelle, die von Alibaba Cloud veröffentlicht wurden. Dieses 7B-Modell hat signifikante Verbesserungen in den Bereichen Codierung und Mathematik. Das Modell bietet auch mehrsprachige Unterstützung und deckt über 29 Sprachen ab, einschließlich Chinesisch und Englisch. Es zeigt signifikante Verbesserungen in der Befolgung von Anweisungen, im Verständnis strukturierter Daten und in der Generierung strukturierter Ausgaben (insbesondere JSON)."
-  },
  "Meta-Llama-3.1-405B-Instruct": {
    "description": "Das auf Anweisungen optimierte Textmodell Llama 3.1 wurde für mehrsprachige Dialoganwendungen optimiert und zeigt in vielen verfügbaren Open-Source- und geschlossenen Chat-Modellen in gängigen Branchenbenchmarks hervorragende Leistungen."
  },
@@ -179,9 +164,6 @@
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": {
    "description": "Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) ist ein hochpräzises Anweisungsmodell, das für komplexe Berechnungen geeignet ist."
  },
-  "OpenGVLab/InternVL2-26B": {
-    "description": "InternVL2 zeigt herausragende Leistungen in verschiedenen visuellen Sprachaufgaben, einschließlich Dokumenten- und Diagrammverständnis, Szenentexterkennung, OCR, wissenschaftlicher und mathematischer Problemlösung."
-  },
  "Phi-3-medium-128k-instruct": {
    "description": "Das gleiche Phi-3-medium-Modell, jedoch mit einer größeren Kontextgröße für RAG oder Few-Shot-Prompting."
  },
@@ -206,9 +188,6 @@
  "Phi-3.5-vision-instrust": {
    "description": "Aktualisierte Version des Phi-3-vision-Modells."
  },
-  "Pro/OpenGVLab/InternVL2-8B": {
-    "description": "InternVL2 zeigt herausragende Leistungen in verschiedenen visuellen Sprachaufgaben, einschließlich Dokumenten- und Diagrammverständnis, Szenentexterkennung, OCR, wissenschaftlicher und mathematischer Problemlösung."
-  },
  "Pro/Qwen/Qwen2-1.5B-Instruct": {
    "description": "Qwen2-1.5B-Instruct ist das anweisungsfeinabgestimmte große Sprachmodell der Qwen2-Serie mit einer Parametergröße von 1,5B. Dieses Modell basiert auf der Transformer-Architektur und verwendet Technologien wie die SwiGLU-Aktivierungsfunktion, QKV-Offsets und gruppierte Abfrageaufmerksamkeit. Es zeigt hervorragende Leistungen in der Sprachverständnis, -generierung, Mehrsprachigkeit, Codierung, Mathematik und Inferenz in mehreren Benchmark-Tests und übertrifft die meisten Open-Source-Modelle. Im Vergleich zu Qwen1.5-1.8B-Chat zeigt Qwen2-1.5B-Instruct in Tests wie MMLU, HumanEval, GSM8K, C-Eval und IFEval signifikante Leistungsverbesserungen, obwohl die Parameteranzahl etwas geringer ist."
  },
@@ -224,20 +203,26 @@
  "Pro/Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct ist die neueste Version der von Alibaba Cloud veröffentlichten Reihe von code-spezifischen großen Sprachmodellen. Dieses Modell basiert auf Qwen2.5 und wurde mit 55 Billionen Tokens trainiert, um die Fähigkeiten zur Codegenerierung, Inferenz und Fehlerbehebung erheblich zu verbessern. Es verbessert nicht nur die Codierungsfähigkeiten, sondern bewahrt auch die Vorteile in Mathematik und allgemeinen Fähigkeiten. Das Modell bietet eine umfassendere Grundlage für praktische Anwendungen wie Code-Agenten."
  },
+  "Pro/Qwen/Qwen2.5-VL-7B-Instruct": {
+    "description": "Qwen2.5-VL ist ein neues Mitglied der Qwen-Serie und verfügt über leistungsstarke visuelle Wahrnehmungsfähigkeiten. Es kann Text, Diagramme und Layouts in Bildern analysieren, längere Videos verstehen und Ereignisse erfassen. Zudem kann es Schlussfolgerungen ziehen, Werkzeuge bedienen, mehrere Formate für Objektlokalisation unterstützen und strukturierte Ausgaben generieren. Die Videoverarbeitung wurde durch dynamische Auflösungs- und Frameratetraining optimiert, und die Effizienz des visuellen Encoders wurde verbessert."
+  },
  "Pro/THUDM/glm-4-9b-chat": {
    "description": "GLM-4-9B-Chat ist die Open-Source-Version des GLM-4-Modells, das von Zhizhu AI eingeführt wurde. Dieses Modell zeigt hervorragende Leistungen in den Bereichen Semantik, Mathematik, Inferenz, Code und Wissen. Neben der Unterstützung für mehrstufige Dialoge bietet GLM-4-9B-Chat auch fortgeschrittene Funktionen wie Web-Browsing, Code-Ausführung, benutzerdefinierte Tool-Aufrufe (Function Call) und langes Textverständnis. Das Modell unterstützt 26 Sprachen, darunter Chinesisch, Englisch, Japanisch, Koreanisch und Deutsch. In mehreren Benchmark-Tests zeigt GLM-4-9B-Chat hervorragende Leistungen, wie AlignBench-v2, MT-Bench, MMLU und C-Eval. Das Modell unterstützt eine maximale Kontextlänge von 128K und ist für akademische Forschung und kommerzielle Anwendungen geeignet."
  },
  "Pro/deepseek-ai/DeepSeek-R1": {
    "description": "DeepSeek-R1 ist ein durch verstärkendes Lernen (RL) gesteuertes Inferenzmodell, das Probleme mit Wiederholungen und Lesbarkeit im Modell löst. Vor dem RL führte DeepSeek-R1 Kaltstartdaten ein, um die Inferenzleistung weiter zu optimieren. Es zeigt in mathematischen, programmierbezogenen und Inferenzaufgaben eine vergleichbare Leistung zu OpenAI-o1 und verbessert die Gesamtleistung durch sorgfältig gestaltete Trainingsmethoden."
  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+    "description": "DeepSeek-R1-Distill-Qwen-1.5B ist ein Modell, das durch Wissensdistillierung auf Basis von Qwen2.5-Math-1.5B erstellt wurde. Dieses Modell wurde mit 800.000 sorgfältig ausgewählten Beispielen, die von DeepSeek-R1 generiert wurden, feinjustiert und zeigt in mehreren Benchmarks gute Leistungen. Als leichtgewichtiges Modell erreicht es eine Genauigkeit von 83,9 % auf MATH-500, einen Durchgangsrate von 28,9 % auf AIME 2024 und eine Bewertung von 954 auf CodeForces, was seine inferenziellen Fähigkeiten über seine Parametergröße hinaus zeigt."
+  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+    "description": "DeepSeek-R1-Distill-Qwen-7B ist ein Modell, das durch Wissensdistillierung auf Basis von Qwen2.5-Math-7B erstellt wurde. Dieses Modell wurde mit 800.000 sorgfältig ausgewählten Beispielen, die von DeepSeek-R1 generiert wurden, feinjustiert und zeigt ausgezeichnete Inferenzfähigkeiten. Es erzielte in mehreren Benchmarks hervorragende Ergebnisse, darunter eine Genauigkeit von 92,8 % im MATH-500, einen Durchgangsrate von 55,5 % im AIME 2024 und eine Bewertung von 1189 auf CodeForces, was seine starken mathematischen und programmierischen Fähigkeiten als Modell mit 7B Parametern unterstreicht."
+  },
  "Pro/deepseek-ai/DeepSeek-V3": {
    "description": "DeepSeek-V3 ist ein hybrides Experten (MoE) Sprachmodell mit 6710 Milliarden Parametern, das eine Multi-Head-Latente-Attention (MLA) und DeepSeekMoE-Architektur verwendet, kombiniert mit einer Lastenausgleichsstrategie ohne Hilfskosten, um die Inferenz- und Trainingseffizienz zu optimieren. Durch das Pre-Training auf 14,8 Billionen hochwertigen Tokens und anschließende überwachte Feinabstimmung und verstärktes Lernen übertrifft DeepSeek-V3 in der Leistung andere Open-Source-Modelle und nähert sich führenden geschlossenen Modellen."
  },
-  "Pro/google/gemma-2-9b-it": {
-    "description": "Gemma ist eines der leichtgewichtigen, hochmodernen offenen Modellserien, die von Google entwickelt wurden. Es handelt sich um ein großes Sprachmodell mit nur Decoder, das Englisch unterstützt und offene Gewichte, vortrainierte Varianten und anweisungsfeinabgestimmte Varianten bietet. Das Gemma-Modell eignet sich für verschiedene Textgenerierungsaufgaben, einschließlich Fragen und Antworten, Zusammenfassungen und Inferenz. Dieses 9B-Modell wurde mit 80 Billionen Tokens trainiert. Seine relativ kleine Größe ermöglicht es, in ressourcenbeschränkten Umgebungen wie Laptops, Desktop-Computern oder Ihrer eigenen Cloud-Infrastruktur bereitgestellt zu werden, wodurch mehr Menschen Zugang zu modernsten KI-Modellen erhalten und Innovationen gefördert werden."
-  },
-  "Pro/meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "Meta Llama 3.1 ist eine Familie von mehrsprachigen großen Sprachmodellen, die von Meta entwickelt wurden und vortrainierte sowie anweisungsfeinabgestimmte Varianten mit 8B, 70B und 405B Parametern umfasst. Dieses 8B-Anweisungsfeinabgestimmte Modell wurde für mehrsprachige Dialogszenarien optimiert und zeigt in mehreren Branchen-Benchmark-Tests hervorragende Leistungen. Das Modelltraining verwendete über 150 Billionen Tokens aus öffentlichen Daten und nutzte Techniken wie überwachte Feinabstimmung und verstärkendes Lernen mit menschlichem Feedback, um die Nützlichkeit und Sicherheit des Modells zu verbessern. Llama 3.1 unterstützt Text- und Codegenerierung, mit einem Wissensstichtag von Dezember 2023."
+  "Pro/deepseek-ai/DeepSeek-V3-1226": {
+    "description": "DeepSeek-V3 ist ein hybrides Expertenmodell (MoE) mit 6710 Milliarden Parametern, das eine Multi-Head-Latente-Attention (MLA) und die DeepSeekMoE-Architektur verwendet, kombiniert mit einer Lastenausgleichsstrategie ohne Hilfskosten, um die Effizienz von Inferenz und Training zu optimieren. Durch das Pre-Training auf 14,8 Billionen hochwertigen Tokens und anschließendes überwachten Feintuning und verstärkendes Lernen übertrifft DeepSeek-V3 in der Leistung andere Open-Source-Modelle und nähert sich führenden Closed-Source-Modellen."
  },
  "QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview ist ein innovatives Modell für die Verarbeitung natürlicher Sprache, das komplexe Aufgaben der Dialoggenerierung und des Kontextverständnisses effizient bewältigen kann."
@@ -290,6 +275,12 @@
  "Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct ist die neueste Version der von Alibaba Cloud veröffentlichten Reihe von code-spezifischen großen Sprachmodellen. Dieses Modell basiert auf Qwen2.5 und wurde mit 55 Billionen Tokens trainiert, um die Fähigkeiten zur Codegenerierung, Inferenz und Fehlerbehebung erheblich zu verbessern. Es verbessert nicht nur die Codierungsfähigkeiten, sondern bewahrt auch die Vorteile in Mathematik und allgemeinen Fähigkeiten. Das Modell bietet eine umfassendere Grundlage für praktische Anwendungen wie Code-Agenten."
  },
+  "Qwen/Qwen2.5-VL-32B-Instruct": {
+    "description": "Qwen2.5-VL-32B-Instruct ist ein multimodales Großmodell, das vom Qwen-Team entwickelt wurde und Teil der Qwen2.5-VL-Reihe ist. Dieses Modell ist nicht nur in der Lage, übliche Objekte zu erkennen, sondern kann auch Text, Diagramme, Symbole, Grafiken und Layouts in Bildern analysieren. Es kann als visueller Agent dienen, der in der Lage ist, zu schließen und Werkzeuge dynamisch zu steuern, wobei es Fähigkeiten im Umgang mit Computern und Smartphones besitzt. Darüber hinaus kann dieses Modell Objekte in Bildern präzise lokalisieren und strukturierte Ausgaben für Rechnungen, Tabellen usw. generieren. Im Vergleich zum Vorgängermodell Qwen2-VL wurde diese Version durch verstärktes Lernen in Mathematik und Problemlösungsfähigkeiten weiter verbessert, und ihr Antwortstil entspricht stärker den menschlichen Vorlieben."
+  },
+  "Qwen/Qwen2.5-VL-72B-Instruct": {
+    "description": "Qwen2.5-VL ist ein visueller Sprachmodell der Qwen2.5-Serie. Dieses Modell zeichnet sich durch erhebliche Verbesserungen aus: Es verfügt über eine stärkere visuelle Wahrnehmungsfähigkeit, kann übliche Objekte erkennen, Texte, Diagramme und Layouts analysieren; als visueller Agent kann es Schlussfolgerungen ziehen und die dynamische Nutzung von Werkzeugen leiten; es unterstützt das Verstehen von Videos mit einer Länge von über einer Stunde und kann wichtige Ereignisse erfassen; es kann durch die Generierung von Begrenzungsrahmen oder Punkten Objekte in Bildern präzise lokalisieren; es unterstützt die Erstellung strukturierter Ausgaben, insbesondere für gescannte Daten wie Rechnungen und Tabellen."
+  },
  "Qwen2-72B-Instruct": {
    "description": "Qwen2 ist die neueste Reihe des Qwen-Modells, das 128k Kontext unterstützt. Im Vergleich zu den derzeit besten Open-Source-Modellen übertrifft Qwen2-72B in den Bereichen natürliche Sprachverständnis, Wissen, Code, Mathematik und Mehrsprachigkeit deutlich die führenden Modelle."
  },
@@ -374,9 +365,6 @@
  "TeleAI/TeleChat2": {
    "description": "Das TeleChat2-Modell ist ein generatives semantisches Großmodell, das von China Telecom von Grund auf neu entwickelt wurde und Funktionen wie Enzyklopädiefragen, Codegenerierung und lange Textgenerierung unterstützt. Es bietet Benutzern Beratungsdienste, ermöglicht Dialoginteraktionen mit Benutzern, beantwortet Fragen, unterstützt bei der Erstellung und hilft Benutzern effizient und bequem, Informationen, Wissen und Inspiration zu erhalten. Das Modell zeigt hervorragende Leistungen in den Bereichen Halluzinationsprobleme, lange Textgenerierung und logisches Verständnis."
  },
-  "TeleAI/TeleMM": {
-    "description": "Das TeleMM-Modell ist ein multimodales Großmodell, das von China Telecom entwickelt wurde und in der Lage ist, Texte, Bilder und andere Modalitäten zu verarbeiten. Es unterstützt Funktionen wie Bildverständnis und Diagrammanalyse und bietet Benutzern multimodale Verständnisdienste. Das Modell kann mit Benutzern multimodal interagieren, den Eingabeinhalt genau verstehen, Fragen beantworten, bei der Erstellung helfen und effizient multimodale Informationen und Inspirationsunterstützung bereitstellen. Es zeigt hervorragende Leistungen in multimodalen Aufgaben wie feinkörniger Wahrnehmung und logischem Schlussfolgern."
-  },
  "Vendor-A/Qwen/Qwen2.5-72B-Instruct": {
    "description": "Qwen2.5-72B-Instruct ist eines der neuesten großen Sprachmodelle, die von Alibaba Cloud veröffentlicht wurden. Dieses 72B-Modell hat signifikante Verbesserungen in den Bereichen Codierung und Mathematik. Das Modell bietet auch mehrsprachige Unterstützung und deckt über 29 Sprachen ab, einschließlich Chinesisch und Englisch. Es zeigt signifikante Verbesserungen in der Befolgung von Anweisungen, im Verständnis strukturierter Daten und in der Generierung strukturierter Ausgaben (insbesondere JSON)."
  },
@@ -506,6 +494,9 @@
  "anthropic/claude-3.5-sonnet": {
    "description": "Claude 3.5 Sonnet bietet Fähigkeiten, die über Opus hinausgehen, und eine schnellere Geschwindigkeit als Sonnet, während es den gleichen Preis wie Sonnet beibehält. Sonnet ist besonders gut in Programmierung, Datenwissenschaft, visueller Verarbeitung und Agentenaufgaben."
  },
+  "anthropic/claude-3.7-sonnet": {
+    "description": "Claude 3.7 Sonnet ist das intelligenteste Modell von Anthropic bis heute und das erste hybride Inferenzmodell auf dem Markt. Claude 3.7 Sonnet kann nahezu sofortige Antworten oder verlängerte, schrittweise Überlegungen erzeugen, wobei die Benutzer diesen Prozess klar nachvollziehen können. Sonnet ist besonders gut in den Bereichen Programmierung, Datenwissenschaft, visuelle Verarbeitung und Agentenaufgaben."
+  },
  "aya": {
    "description": "Aya 23 ist ein mehrsprachiges Modell von Cohere, das 23 Sprachen unterstützt und die Anwendung in einer Vielzahl von Sprachen erleichtert."
  },
@@ -515,9 +506,27 @@
  "baichuan/baichuan2-13b-chat": {
    "description": "Baichuan-13B ist ein Open-Source-Sprachmodell mit 13 Milliarden Parametern, das von Baichuan Intelligence entwickelt wurde und in autorisierten chinesischen und englischen Benchmarks die besten Ergebnisse in seiner Größenordnung erzielt hat."
  },
+  "c4ai-aya-expanse-32b": {
+    "description": "Aya Expanse ist ein leistungsstarkes 32B mehrsprachiges Modell, das darauf abzielt, die Leistung von einsprachigen Modellen durch innovative Ansätze wie Anweisungsoptimierung, Datenarbitrage, Präferenztraining und Modellfusion herauszufordern. Es unterstützt 23 Sprachen."
+  },
+  "c4ai-aya-expanse-8b": {
+    "description": "Aya Expanse ist ein leistungsstarkes 8B mehrsprachiges Modell, das darauf abzielt, die Leistung von einsprachigen Modellen durch innovative Ansätze wie Anweisungsoptimierung, Datenarbitrage, Präferenztraining und Modellfusion herauszufordern. Es unterstützt 23 Sprachen."
+  },
+  "c4ai-aya-vision-32b": {
+    "description": "Aya Vision ist ein hochmodernes multimodales Modell, das in mehreren wichtigen Benchmarks für Sprache, Text und Bild hervorragende Leistungen zeigt. Diese 32B-Version konzentriert sich auf die fortschrittlichste mehrsprachige Leistung und unterstützt 23 Sprachen."
+  },
+  "c4ai-aya-vision-8b": {
+    "description": "Aya Vision ist ein hochmodernes multimodales Modell, das in mehreren wichtigen Benchmarks für Sprache, Text und Bild hervorragende Leistungen zeigt. Diese 8B-Version konzentriert sich auf niedrige Latenz und optimale Leistung."
+  },
  "charglm-3": {
    "description": "CharGLM-3 ist für Rollenspiele und emotionale Begleitung konzipiert und unterstützt extrem lange Mehrfachgedächtnisse und personalisierte Dialoge, mit breiter Anwendung."
  },
+  "chatglm3": {
+    "description": "ChatGLM3 ist ein proprietäres Modell, das von der KI-Forschungsgruppe Zhipu AI und dem KEG-Labor der Tsinghua-Universität veröffentlicht wurde. Es wurde durch umfangreiche Vortrainings mit chinesischen und englischen Bezeichnern sowie durch die Anpassung an menschliche Präferenzen entwickelt. Im Vergleich zum ersten Modell erzielte es Verbesserungen von 16 %, 36 % und 280 % in den Benchmarks MMLU, C-Eval und GSM8K und steht an der Spitze der chinesischen Aufgabenliste C-Eval. Es eignet sich für Szenarien, die hohe Anforderungen an das Wissensvolumen, die Inferenzfähigkeit und die Kreativität stellen, wie z. B. die Erstellung von Werbetexten, das Schreiben von Romanen, wissensbasiertes Schreiben und die Generierung von Code."
+  },
+  "chatglm3-6b-base": {
+    "description": "ChatGLM3-6b-base ist das neueste Modell der ChatGLM-Serie mit 6 Milliarden Parametern, entwickelt von Zhipu."
+  },
  "chatgpt-4o-latest": {
    "description": "ChatGPT-4o ist ein dynamisches Modell, das in Echtzeit aktualisiert wird, um die neueste Version zu gewährleisten. Es kombiniert starke Sprachverständnis- und Generierungsfähigkeiten und eignet sich für großangelegte Anwendungsszenarien, einschließlich Kundenservice, Bildung und technische Unterstützung."
  },
@@ -593,12 +602,39 @@
  "cohere-command-r-plus": {
    "description": "Command R+ ist ein hochmodernes, RAG-optimiertes Modell, das für unternehmensgerechte Arbeitslasten konzipiert ist."
  },
+  "command": {
+    "description": "Ein dialogbasiertes Modell, das Anweisungen folgt und in sprachlichen Aufgaben hohe Qualität und Zuverlässigkeit bietet. Im Vergleich zu unserem grundlegenden Generierungsmodell hat es eine längere Kontextlänge."
+  },
+  "command-a-03-2025": {
+    "description": "Command A ist unser bisher leistungsstärkstes Modell, das in der Nutzung von Werkzeugen, Agenten, Retrieval-Enhanced Generation (RAG) und mehrsprachigen Anwendungsszenarien hervorragende Leistungen zeigt. Command A hat eine Kontextlänge von 256K, benötigt nur zwei GPUs zum Betrieb und bietet im Vergleich zu Command R+ 08-2024 eine Steigerung der Durchsatzrate um 150 %."
+  },
+  "command-light": {
+    "description": "Eine kleinere, schnellere Version von Command, die fast ebenso leistungsstark ist, aber schneller arbeitet."
+  },
+  "command-light-nightly": {
+    "description": "Um die Zeitspanne zwischen den Hauptversionsveröffentlichungen zu verkürzen, haben wir eine nächtliche Version des Command Modells eingeführt. Für die command-light-Serie wird diese Version als command-light-nightly bezeichnet. Bitte beachten Sie, dass command-light-nightly die neueste, experimentellste und (möglicherweise) instabilste Version ist. Die nächtlichen Versionen werden regelmäßig aktualisiert, ohne vorherige Ankündigung, daher wird die Verwendung in Produktionsumgebungen nicht empfohlen."
+  },
+  "command-nightly": {
+    "description": "Um die Zeitspanne zwischen den Hauptversionsveröffentlichungen zu verkürzen, haben wir eine nächtliche Version des Command Modells eingeführt. Für die Command-Serie wird diese Version als command-cightly bezeichnet. Bitte beachten Sie, dass command-nightly die neueste, experimentellste und (möglicherweise) instabilste Version ist. Die nächtlichen Versionen werden regelmäßig aktualisiert, ohne vorherige Ankündigung, daher wird die Verwendung in Produktionsumgebungen nicht empfohlen."
+  },
  "command-r": {
    "description": "Command R ist ein LLM, das für Dialoge und Aufgaben mit langen Kontexten optimiert ist und sich besonders gut für dynamische Interaktionen und Wissensmanagement eignet."
  },
+  "command-r-03-2024": {
+    "description": "Command R ist ein dialogbasiertes Modell, das Anweisungen folgt und in sprachlichen Aufgaben eine höhere Qualität und Zuverlässigkeit bietet. Im Vergleich zu früheren Modellen hat es eine längere Kontextlänge. Es kann für komplexe Workflows wie Codegenerierung, Retrieval-Enhanced Generation (RAG), Werkzeugnutzung und Agenten verwendet werden."
+  },
+  "command-r-08-2024": {
+    "description": "command-r-08-2024 ist die aktualisierte Version des Command R Modells, das im August 2024 veröffentlicht wurde."
+  },
  "command-r-plus": {
    "description": "Command R+ ist ein leistungsstarkes großes Sprachmodell, das speziell für reale Unternehmensszenarien und komplexe Anwendungen entwickelt wurde."
  },
+  "command-r-plus-04-2024": {
+    "description": "Command R+ ist ein dialogbasiertes Modell, das Anweisungen folgt und in sprachlichen Aufgaben eine höhere Qualität und Zuverlässigkeit bietet. Im Vergleich zu früheren Modellen hat es eine längere Kontextlänge. Es eignet sich am besten für komplexe RAG-Workflows und mehrstufige Werkzeugnutzung."
+  },
+  "command-r7b-12-2024": {
+    "description": "command-r7b-12-2024 ist eine kompakte und effiziente aktualisierte Version, die im Dezember 2024 veröffentlicht wurde. Es zeigt hervorragende Leistungen in Aufgaben, die komplexes Denken und mehrstufige Verarbeitung erfordern, wie RAG, Werkzeugnutzung und Agenten."
+  },
  "dall-e-2": {
    "description": "Zweite Generation des DALL·E-Modells, unterstützt realistischere und genauere Bildgenerierung, mit einer Auflösung, die viermal so hoch ist wie die der ersten Generation."
  },
@@ -614,9 +650,6 @@
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": {
    "description": "Das DeepSeek-R1-Distill-Modell optimiert die Inferenzleistung durch verstärkendes Lernen und Kaltstartdaten. Das Open-Source-Modell setzt neue Maßstäbe für Multitasking."
  },
-  "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
-    "description": "DeepSeek-R1-Distill-Llama-8B ist ein destilliertes Modell, das auf Llama-3.1-8B basiert. Dieses Modell wurde mit Beispielen, die von DeepSeek-R1 generiert wurden, feinabgestimmt und zeigt hervorragende Inferenzfähigkeiten. Es hat in mehreren Benchmark-Tests gut abgeschnitten, darunter eine Genauigkeit von 89,1 % in MATH-500, eine Bestehensquote von 50,4 % in AIME 2024 und eine Bewertung von 1205 in CodeForces, was starke mathematische und Programmierfähigkeiten für ein 8B-Modell demonstriert."
-  },
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
    "description": "Das DeepSeek-R1-Distill-Modell optimiert die Inferenzleistung durch verstärkendes Lernen und Kaltstartdaten. Das Open-Source-Modell setzt neue Maßstäbe für Multitasking."
  },
@@ -659,12 +692,30 @@
  "deepseek-r1": {
    "description": "DeepSeek-R1 ist ein durch verstärkendes Lernen (RL) gesteuertes Inferenzmodell, das die Probleme der Wiederholbarkeit und Lesbarkeit im Modell löst. Vor dem RL führte DeepSeek-R1 Kaltstartdaten ein, um die Inferenzleistung weiter zu optimieren. Es zeigt in mathematischen, programmierbezogenen und Inferenzaufgaben eine vergleichbare Leistung zu OpenAI-o1 und verbessert durch sorgfältig gestaltete Trainingsmethoden die Gesamteffizienz."
  },
+  "deepseek-r1-70b-fast-online": {
+    "description": "DeepSeek R1 70B Schnellversion, die Echtzeit-Online-Suche unterstützt und eine schnellere Reaktionszeit bei gleichbleibender Modellleistung bietet."
+  },
+  "deepseek-r1-70b-online": {
+    "description": "DeepSeek R1 70B Standardversion, die Echtzeit-Online-Suche unterstützt und sich für Dialoge und Textverarbeitungsaufgaben eignet, die aktuelle Informationen benötigen."
+  },
+  "deepseek-r1-distill-llama": {
+    "description": "deepseek-r1-distill-llama ist ein Modell, das auf der Grundlage von Llama aus DeepSeek-R1 destilliert wurde."
+  },
  "deepseek-r1-distill-llama-70b": {
    "description": "DeepSeek R1 – das größere und intelligentere Modell im DeepSeek-Paket – wurde in die Llama 70B-Architektur destilliert. Basierend auf Benchmark-Tests und menschlicher Bewertung ist dieses Modell intelligenter als das ursprüngliche Llama 70B, insbesondere bei Aufgaben, die mathematische und faktische Genauigkeit erfordern."
  },
  "deepseek-r1-distill-llama-8b": {
    "description": "Das DeepSeek-R1-Distill Modell wurde durch Wissensdistillationstechniken entwickelt, indem Proben, die von DeepSeek-R1 generiert wurden, auf Qwen, Llama und andere Open-Source-Modelle feinabgestimmt wurden."
  },
+  "deepseek-r1-distill-qianfan-llama-70b": {
+    "description": "Erstmals veröffentlicht am 14. Februar 2025, destilliert vom Qianfan-Modellteam auf Basis des Llama3_70B Modells (gebaut mit Meta Llama), wobei auch die Qianfan-Korpora in die Destillationsdaten aufgenommen wurden."
+  },
+  "deepseek-r1-distill-qianfan-llama-8b": {
+    "description": "Erstmals veröffentlicht am 14. Februar 2025, destilliert vom Qianfan-Modellteam auf Basis des Llama3_8B Modells (gebaut mit Meta Llama), wobei auch die Qianfan-Korpora in die Destillationsdaten aufgenommen wurden."
+  },
+  "deepseek-r1-distill-qwen": {
+    "description": "deepseek-r1-distill-qwen ist ein Modell, das auf der Grundlage von Qwen durch Distillierung aus DeepSeek-R1 erstellt wurde."
+  },
  "deepseek-r1-distill-qwen-1.5b": {
    "description": "Das DeepSeek-R1-Distill Modell wurde durch Wissensdistillationstechniken entwickelt, indem Proben, die von DeepSeek-R1 generiert wurden, auf Qwen, Llama und andere Open-Source-Modelle feinabgestimmt wurden."
  },
@@ -677,6 +728,12 @@
  "deepseek-r1-distill-qwen-7b": {
    "description": "Das DeepSeek-R1-Distill Modell wurde durch Wissensdistillationstechniken entwickelt, indem Proben, die von DeepSeek-R1 generiert wurden, auf Qwen, Llama und andere Open-Source-Modelle feinabgestimmt wurden."
  },
+  "deepseek-r1-fast-online": {
+    "description": "DeepSeek R1 Vollschnellversion, die Echtzeit-Online-Suche unterstützt und die leistungsstarken Fähigkeiten von 671B Parametern mit einer schnelleren Reaktionszeit kombiniert."
+  },
+  "deepseek-r1-online": {
+    "description": "DeepSeek R1 Vollversion mit 671B Parametern, die Echtzeit-Online-Suche unterstützt und über verbesserte Verständnis- und Generierungsfähigkeiten verfügt."
+  },
  "deepseek-reasoner": {
    "description": "Das von DeepSeek entwickelte Inferenzmodell. Bevor das Modell die endgültige Antwort ausgibt, gibt es zunächst eine Denkprozesskette aus, um die Genauigkeit der endgültigen Antwort zu erhöhen."
  },
@@ -689,6 +746,9 @@
  "deepseek-v3": {
    "description": "DeepSeek-V3 ist ein MoE-Modell, das von der Hangzhou DeepSeek Artificial Intelligence Technology Research Co., Ltd. entwickelt wurde. Es hat in mehreren Bewertungen herausragende Ergebnisse erzielt und belegt in den gängigen Rankings den ersten Platz unter den Open-Source-Modellen. Im Vergleich zum V2.5-Modell hat sich die Generierungsgeschwindigkeit um das Dreifache erhöht, was den Nutzern ein schnelleres und flüssigeres Nutzungserlebnis bietet."
  },
+  "deepseek-v3-0324": {
+    "description": "DeepSeek-V3-0324 ist ein MoE-Modell mit 671 Milliarden Parametern, das in den Bereichen Programmierung und technische Fähigkeiten, Kontextverständnis und Verarbeitung langer Texte herausragende Vorteile bietet."
+  },
  "deepseek/deepseek-chat": {
    "description": "Ein neues Open-Source-Modell, das allgemeine und Codefähigkeiten vereint. Es behält nicht nur die allgemeinen Dialogfähigkeiten des ursprünglichen Chat-Modells und die leistungsstarken Codeverarbeitungsfähigkeiten des Coder-Modells bei, sondern stimmt auch besser mit menschlichen Vorlieben überein. Darüber hinaus hat DeepSeek-V2.5 in vielen Bereichen wie Schreibaufgaben und Befehlsbefolgung erhebliche Verbesserungen erzielt."
  },
@@ -755,6 +815,9 @@
  "ernie-4.0-turbo-8k-preview": {
    "description": "Das von Baidu entwickelte Flaggschiff-Modell für große Sprachmodelle zeigt hervorragende Gesamtergebnisse und ist weit verbreitet in komplexen Aufgabenbereichen anwendbar; es unterstützt die automatische Anbindung an das Baidu-Suchplugin, um die Aktualität der Antwortinformationen zu gewährleisten. Im Vergleich zu ERNIE 4.0 bietet es eine bessere Leistung."
  },
+  "ernie-4.5-8k-preview": {
+    "description": "Das ERNIE 4.5 Modell ist ein neu entwickeltes, natives multimodales Basis-Modell von Baidu, das durch die gemeinsame Modellierung mehrerer Modalitäten eine synergistische Optimierung erreicht und über hervorragende multimodale Verständnisfähigkeiten verfügt; es bietet verbesserte Sprachfähigkeiten, umfassende Verbesserungen in Verständnis, Generierung, Logik und Gedächtnis, sowie signifikante Verbesserungen in der Vermeidung von Halluzinationen, logischen Schlussfolgerungen und Programmierfähigkeiten."
+  },
  "ernie-char-8k": {
    "description": "Das von Baidu entwickelte große Sprachmodell für vertikale Szenarien eignet sich für Anwendungen wie NPCs in Spielen, Kundenservice-Dialoge und Rollenspiele, mit einem klareren und konsistenteren Charakterstil, einer stärkeren Befolgung von Anweisungen und besserer Inferenzleistung."
  },
@@ -788,9 +851,6 @@
  "gemini-1.0-pro-latest": {
    "description": "Gemini 1.0 Pro ist Googles leistungsstarkes KI-Modell, das für die Skalierung einer Vielzahl von Aufgaben konzipiert ist."
  },
-  "gemini-1.5-flash": {
-    "description": "Gemini 1.5 Flash ist Googles neuestes multimodales KI-Modell, das über eine schnelle Verarbeitungskapazität verfügt und Texte, Bilder und Videoeingaben unterstützt, um eine effiziente Skalierung für verschiedene Aufgaben zu ermöglichen."
-  },
  "gemini-1.5-flash-001": {
    "description": "Gemini 1.5 Flash 001 ist ein effizientes multimodales Modell, das eine breite Anwendbarkeit unterstützt."
  },
@@ -803,6 +863,9 @@
  "gemini-1.5-flash-8b-exp-0924": {
    "description": "Gemini 1.5 Flash 8B 0924 ist das neueste experimentelle Modell, das in Text- und multimodalen Anwendungsfällen erhebliche Leistungsverbesserungen aufweist."
  },
+  "gemini-1.5-flash-8b-latest": {
+    "description": "Gemini 1.5 Flash 8B ist ein effizientes multimodales Modell, das eine breite Palette von Anwendungen unterstützt."
+  },
  "gemini-1.5-flash-exp-0827": {
    "description": "Gemini 1.5 Flash 0827 bietet optimierte multimodale Verarbeitungskapazitäten, die für verschiedene komplexe Aufgaben geeignet sind."
  },
@@ -830,24 +893,27 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash bietet nächste Generation Funktionen und Verbesserungen, einschließlich außergewöhnlicher Geschwindigkeit, nativer Werkzeugnutzung, multimodaler Generierung und einem Kontextfenster von 1M Tokens."
  },
+  "gemini-2.0-flash-exp": {
+    "description": "Gemini 2.0 Flash-Modellvariante, die auf Kosteneffizienz und niedrige Latenz optimiert ist."
+  },
+  "gemini-2.0-flash-exp-image-generation": {
+    "description": "Gemini 2.0 Flash Experimentmodell, das die Bildgenerierung unterstützt"
+  },
  "gemini-2.0-flash-lite": {
    "description": "Gemini 2.0 Flash ist eine Modellvariante, die auf Kosteneffizienz und niedrige Latenz optimiert ist."
  },
  "gemini-2.0-flash-lite-001": {
    "description": "Gemini 2.0 Flash ist eine Modellvariante, die auf Kosteneffizienz und niedrige Latenz optimiert ist."
  },
-  "gemini-2.0-flash-lite-preview-02-05": {
-    "description": "Ein Gemini 2.0 Flash Modell, das auf Kosteneffizienz und niedrige Latenz optimiert wurde."
-  },
-  "gemini-2.0-flash-thinking-exp": {
-    "description": "Gemini 2.0 Flash Exp ist Googles neuestes experimentelles multimodales KI-Modell mit der nächsten Generation von Funktionen, außergewöhnlicher Geschwindigkeit, nativer Tool-Nutzung und multimodaler Generierung."
-  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp ist Googles neuestes experimentelles multimodales KI-Modell mit der nächsten Generation von Funktionen, außergewöhnlicher Geschwindigkeit, nativer Tool-Nutzung und multimodaler Generierung."
  },
  "gemini-2.0-pro-exp-02-05": {
    "description": "Gemini 2.0 Pro Experimental ist Googles neuestes experimentelles multimodales KI-Modell, das im Vergleich zu früheren Versionen eine gewisse Qualitätsverbesserung aufweist, insbesondere in Bezug auf Weltwissen, Code und lange Kontexte."
  },
+  "gemini-2.5-pro-exp-03-25": {
+    "description": "Gemini 2.5 Pro Experimental ist Googles fortschrittlichstes Denkmodell, das in der Lage ist, komplexe Probleme in den Bereichen Code, Mathematik und STEM zu analysieren. Es kann auch lange Kontexte nutzen, um große Datensätze, Codebasen und Dokumente zu analysieren."
+  },
  "gemma-7b-it": {
    "description": "Gemma 7B eignet sich für die Verarbeitung von mittelgroßen Aufgaben und bietet ein gutes Kosten-Nutzen-Verhältnis."
  },
@@ -1016,6 +1082,9 @@
  "gpt-4o-mini-realtime-preview": {
    "description": "Echtzeitversion von GPT-4o-mini, unterstützt Audio- und Texteingabe sowie -ausgabe in Echtzeit."
  },
+  "gpt-4o-mini-tts": {
+    "description": "GPT-4o mini TTS ist ein Text-to-Speech-Modell, das auf GPT-4o mini basiert und hochwertige Sprachgenerierung bei niedrigeren Kosten bietet."
+  },
  "gpt-4o-realtime-preview": {
    "description": "Echtzeitversion von GPT-4o, unterstützt Audio- und Texteingabe sowie -ausgabe in Echtzeit."
  },
@@ -1073,6 +1142,12 @@
  "hunyuan-standard-vision": {
    "description": "Das neueste multimodale Modell von Hunyuan, das mehrsprachige Antworten unterstützt und sowohl in Chinesisch als auch in Englisch ausgewogen ist."
  },
+  "hunyuan-t1-20250321": {
+    "description": "Umfassende Entwicklung der Modellfähigkeiten in Geistes- und Naturwissenschaften, starke Fähigkeit zur Erfassung langer Textinformationen. Unterstützt die Lösung von wissenschaftlichen Problemen in verschiedenen Schwierigkeitsgraden, einschließlich Mathematik, logischem Denken, Wissenschaft und Code."
+  },
+  "hunyuan-t1-latest": {
+    "description": "Das erste ultra-skalierbare Hybrid-Transformer-Mamba-Inferenzmodell der Branche, das die Inferenzfähigkeiten erweitert, eine extrem hohe Dekodierungsgeschwindigkeit bietet und weiter auf menschliche Präferenzen abgestimmt ist."
+  },
  "hunyuan-translation": {
    "description": "Unterstützt die Übersetzung zwischen Chinesisch und Englisch, Japanisch, Französisch, Portugiesisch, Spanisch, Türkisch, Russisch, Arabisch, Koreanisch, Italienisch, Deutsch, Vietnamesisch, Malaiisch und Indonesisch in 15 Sprachen. Basierend auf einem automatisierten Bewertungs-Framework COMET, das auf mehrsprachigen Übersetzungsbewertungsszenarien basiert, übertrifft es insgesamt die Übersetzungsfähigkeiten anderer Modelle ähnlicher Größe auf dem Markt."
  },
@@ -1082,9 +1157,6 @@
  "hunyuan-turbo": {
    "description": "Die Vorschauversion des neuen großen Sprachmodells von Hunyuan verwendet eine neuartige hybride Expertenmodellstruktur (MoE) und bietet im Vergleich zu Hunyuan-Pro eine schnellere Inferenz und bessere Leistung."
  },
-  "hunyuan-turbo-20241120": {
-    "description": "Hunyuan-turbo Version vom 20. November 2024, eine feste Version, die zwischen hunyuan-turbo und hunyuan-turbo-latest liegt."
-  },
  "hunyuan-turbo-20241223": {
    "description": "Diese Version optimiert: Datenanweisungs-Skalierung, erhebliche Verbesserung der allgemeinen Generalisierungsfähigkeit des Modells; erhebliche Verbesserung der mathematischen, programmierbaren und logischen Denkfähigkeiten; Optimierung der Fähigkeiten im Textverständnis und der Wortverständnisfähigkeiten; Optimierung der Qualität der Inhaltserzeugung in der Texterstellung."
  },
@@ -1094,6 +1166,15 @@
  "hunyuan-turbo-vision": {
    "description": "Das neue Flaggschiff-Modell der visuellen Sprache von Hunyuan, das eine brandneue Struktur des gemischten Expertenmodells (MoE) verwendet, bietet umfassende Verbesserungen in den Fähigkeiten zur grundlegenden Erkennung, Inhaltserstellung, Wissensfragen und Analyse sowie Schlussfolgerungen im Vergleich zum vorherigen Modell."
  },
+  "hunyuan-turbos-20250226": {
+    "description": "hunyuan-TurboS pv2.1.2 ist eine feste Version mit aktualisierten Trainings-Tokens; verbesserte Denkfähigkeiten in Mathematik/Logik/Code; verbesserte allgemeine Erfahrung in Chinesisch und Englisch, einschließlich Textgenerierung, Textverständnis, Wissensfragen und Smalltalk."
+  },
+  "hunyuan-turbos-20250313": {
+    "description": "Ein einheitlicher Stil für mathematische Problemlösungsprozesse, der die mehrstufige Beantwortung von mathematischen Fragen verbessert. Textgenerierung optimiert den Antwortstil, entfernt AI-typische Formulierungen und erhöht die sprachliche Eleganz."
+  },
+  "hunyuan-turbos-latest": {
+    "description": "hunyuan-TurboS ist die neueste Version des Hunyuan-Flaggschiffmodells, das über verbesserte Denkfähigkeiten und ein besseres Nutzungserlebnis verfügt."
+  },
  "hunyuan-vision": {
    "description": "Das neueste multimodale Modell von Hunyuan unterstützt die Eingabe von Bildern und Text zur Generierung von Textinhalten."
  },
@@ -1124,12 +1205,18 @@
  "lite": {
    "description": "Spark Lite ist ein leichtgewichtiges großes Sprachmodell mit extrem niedriger Latenz und effizienter Verarbeitung, das vollständig kostenlos und offen ist und Echtzeitsuchfunktionen unterstützt. Seine schnelle Reaktionsfähigkeit macht es besonders geeignet für Inferenzanwendungen und Modellanpassungen auf Geräten mit geringer Rechenleistung und bietet den Nutzern ein hervorragendes Kosten-Nutzen-Verhältnis sowie ein intelligentes Erlebnis, insbesondere in den Bereichen Wissensabfragen, Inhaltserstellung und Suchszenarien."
  },
+  "llama-2-7b-chat": {
+    "description": "Llama2 ist eine Serie großer Sprachmodelle (LLM), die von Meta entwickelt und als Open Source veröffentlicht wurden. Diese Serie umfasst generative Textmodelle mit einer Parameteranzahl von 7 Milliarden bis 70 Milliarden, die vortrainiert und feinjustiert wurden. Architekturtechnisch ist Llama2 ein autoregressives Sprachmodell, das eine optimierte Transformer-Architektur verwendet. Die angepassten Versionen nutzen überwachte Feinabstimmung (SFT) und Reinforcement Learning mit menschlichem Feedback (RLHF), um den menschlichen Vorlieben für Nützlichkeit und Sicherheit zu entsprechen. Llama2 übertrifft die Leistung der Llama-Serie in mehreren akademischen Datensätzen und bietet Inspiration für die Entwicklung und Gestaltung vieler anderer Modelle."
+  },
  "llama-3.1-70b-versatile": {
    "description": "Llama 3.1 70B bietet leistungsstarke KI-Schlussfolgerungsfähigkeiten, die für komplexe Anwendungen geeignet sind und eine hohe Rechenverarbeitung bei gleichzeitiger Effizienz und Genauigkeit unterstützen."
  },
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B ist ein leistungsstarkes Modell, das schnelle Textgenerierungsfähigkeiten bietet und sich hervorragend für Anwendungen eignet, die große Effizienz und Kosteneffektivität erfordern."
  },
+  "llama-3.1-instruct": {
+    "description": "Das Llama 3.1 Instruktionstuning-Modell ist für Dialogszenarien optimiert und übertrifft in gängigen Branchenbenchmarks viele bestehende Open-Source-Chatmodelle."
+  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Überlegene Bildverarbeitungsfähigkeiten auf hochauflösenden Bildern, geeignet für visuelle Verständnisanwendungen."
  },
@@ -1142,12 +1229,18 @@
  "llama-3.2-90b-vision-preview": {
    "description": "Llama 3.2 ist darauf ausgelegt, Aufgaben zu bearbeiten, die visuelle und textuelle Daten kombinieren. Es zeigt hervorragende Leistungen bei Aufgaben wie Bildbeschreibung und visuellen Fragen und Antworten und überbrückt die Kluft zwischen Sprachgenerierung und visueller Schlussfolgerung."
  },
+  "llama-3.2-vision-instruct": {
+    "description": "Das Llama 3.2-Vision-Instruct-Modell ist optimiert für visuelle Erkennung, Bildschlussfolgerungen, Bildbeschreibungen und das Beantworten von allgemeinen Fragen, die mit Bildern zusammenhängen."
+  },
  "llama-3.3-70b-instruct": {
    "description": "Llama 3.3 ist das fortschrittlichste mehrsprachige Open-Source-Sprachmodell der Llama-Serie, das eine Leistung bietet, die mit einem 405B-Modell vergleichbar ist, und das zu extrem niedrigen Kosten. Es basiert auf der Transformer-Architektur und verbessert die Nützlichkeit und Sicherheit durch überwachte Feinabstimmung (SFT) und verstärkendes Lernen mit menschlichem Feedback (RLHF). Die auf Anweisungen optimierte Version ist speziell für mehrsprachige Dialoge optimiert und übertrifft in mehreren Branchenbenchmarks viele Open-Source- und geschlossene Chat-Modelle. Das Wissensdatum endet im Dezember 2023."
  },
  "llama-3.3-70b-versatile": {
    "description": "Das Meta Llama 3.3 ist ein mehrsprachiges, großes Sprachmodell (LLM), das aus einem vortrainierten und anweisungsorientierten generativen Modell mit 70B (Text-Eingabe/Text-Ausgabe) besteht. Das anweisungsorientierte Modell von Llama 3.3 ist für mehrsprachige Dialoganwendungen optimiert und übertrifft viele verfügbare Open-Source- und Closed-Source-Chat-Modelle bei gängigen Branchenbenchmarks."
  },
+  "llama-3.3-instruct": {
+    "description": "Das Llama 3.3 Instruct-Modell ist für Dialogszenarien optimiert und übertrifft in gängigen Branchenbenchmarks viele bestehende Open-Source-Chatmodelle."
+  },
  "llama3-70b-8192": {
    "description": "Meta Llama 3 70B bietet unvergleichliche Fähigkeiten zur Verarbeitung von Komplexität und ist maßgeschneidert für Projekte mit hohen Anforderungen."
  },
@@ -1187,6 +1280,9 @@
  "max-32k": {
    "description": "Spark Max 32K bietet eine große Kontextverarbeitungsfähigkeit mit verbesserter Kontextverständnis und logischer Schlussfolgerungsfähigkeit und unterstützt Texteingaben von bis zu 32K Tokens, was es ideal für das Lesen langer Dokumente und private Wissensabfragen macht."
  },
+  "megrez-3b-instruct": {
+    "description": "Megrez-3B-Instruct ist ein großes Sprachmodell, das vollständig von Wuxin XinQiong trainiert wurde. Megrez-3B-Instruct zielt darauf ab, durch die Idee der Hardware-Software-Kooperation eine schnelle Inferenz, ein kompaktes Design und eine benutzerfreundliche Endgerätlösung zu schaffen."
+  },
  "meta-llama-3-70b-instruct": {
    "description": "Ein leistungsstarkes Modell mit 70 Milliarden Parametern, das in den Bereichen Schlussfolgerungen, Programmierung und breiten Sprachanwendungen herausragt."
  },
@@ -1223,9 +1319,6 @@
  "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": {
    "description": "LLaMA 3.2 ist darauf ausgelegt, Aufgaben zu bewältigen, die sowohl visuelle als auch Textdaten kombinieren. Es erzielt hervorragende Ergebnisse bei Aufgaben wie Bildbeschreibung und visueller Fragebeantwortung und überbrückt die Kluft zwischen Sprachgenerierung und visueller Schlussfolgerung."
  },
-  "meta-llama/Llama-3.3-70B-Instruct": {
-    "description": "Llama 3.3 ist das fortschrittlichste mehrsprachige Open-Source-Sprachmodell der Llama-Serie, das zu extrem niedrigen Kosten eine Leistung bietet, die mit der eines 405B-Modells vergleichbar ist. Basierend auf der Transformer-Architektur und verbessert durch überwachte Feinabstimmung (SFT) und verstärkendes Lernen mit menschlichem Feedback (RLHF) für Nützlichkeit und Sicherheit. Die optimierte Version für Anweisungen ist speziell für mehrsprachige Dialoge optimiert und übertrifft in mehreren Branchenbenchmarks viele Open-Source- und geschlossene Chat-Modelle. Wissensstichtag ist der 31. Dezember 2023."
-  },
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
    "description": "Das Meta Llama 3.3 mehrsprachige große Sprachmodell (LLM) ist ein vortrainiertes und anweisungsoptimiertes Generierungsmodell mit 70B (Textinput/Textoutput). Das anweisungsoptimierte reine Textmodell von Llama 3.3 wurde für mehrsprachige Dialoganwendungen optimiert und übertrifft viele verfügbare Open-Source- und geschlossene Chat-Modelle in gängigen Branchenbenchmarks."
  },
@@ -1253,15 +1346,9 @@
  "meta-llama/Meta-Llama-3.1-70B": {
    "description": "Llama 3.1 ist das führende Modell von Meta, das bis zu 405B Parameter unterstützt und in komplexen Gesprächen, mehrsprachiger Übersetzung und Datenanalyse eingesetzt werden kann."
  },
-  "meta-llama/Meta-Llama-3.1-70B-Instruct": {
-    "description": "LLaMA 3.1 70B bietet effiziente Dialogunterstützung in mehreren Sprachen."
-  },
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
    "description": "Das Llama 3.1 70B-Modell wurde feinabgestimmt und eignet sich für hochbelastete Anwendungen, die auf FP8 quantisiert wurden, um eine effizientere Rechenleistung und Genauigkeit zu bieten und in komplexen Szenarien hervorragende Leistungen zu gewährleisten."
  },
-  "meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "LLaMA 3.1 bietet Unterstützung für mehrere Sprachen und ist eines der führenden Generierungsmodelle der Branche."
-  },
  "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
    "description": "Das Llama 3.1 8B-Modell verwendet FP8-Quantisierung und unterstützt bis zu 131.072 Kontextmarkierungen, es ist eines der besten Open-Source-Modelle, das sich für komplexe Aufgaben eignet und in vielen Branchenbenchmarks übertrifft."
  },
@@ -1355,12 +1442,18 @@
  "mistral-large": {
    "description": "Mixtral Large ist das Flaggschiff-Modell von Mistral, das die Fähigkeiten zur Codegenerierung, Mathematik und Schlussfolgerungen kombiniert und ein Kontextfenster von 128k unterstützt."
  },
+  "mistral-large-instruct": {
+    "description": "Mistral-Large-Instruct-2407 ist ein fortschrittliches dichtes großes Sprachmodell (LLM) mit 123 Milliarden Parametern und verfügt über state-of-the-art-Schließen, Wissen und Codierungsfähigkeiten."
+  },
  "mistral-large-latest": {
    "description": "Mistral Large ist das Flaggschiff-Modell, das sich gut für mehrsprachige Aufgaben, komplexe Schlussfolgerungen und Codegenerierung eignet und die ideale Wahl für hochentwickelte Anwendungen ist."
  },
  "mistral-nemo": {
    "description": "Mistral Nemo wurde in Zusammenarbeit mit Mistral AI und NVIDIA entwickelt und ist ein leistungsstarkes 12B-Modell."
  },
+  "mistral-nemo-instruct": {
+    "description": "Das große Sprachmodell (LLM) Mistral-Nemo-Instruct-2407 ist eine auf Befehle angepasste Version von Mistral-Nemo-Base-2407."
+  },
  "mistral-small": {
    "description": "Mistral Small kann für jede sprachbasierte Aufgabe verwendet werden, die hohe Effizienz und geringe Latenz erfordert."
  },
@@ -1577,6 +1670,12 @@
  "qwen2": {
    "description": "Qwen2 ist das neue große Sprachmodell von Alibaba, das mit hervorragender Leistung eine Vielzahl von Anwendungsanforderungen unterstützt."
  },
+  "qwen2-72b-instruct": {
+    "description": "Qwen2 ist die neueste Generation von Sprachmodellen, die vom Qwen-Team entwickelt wurde. Es basiert auf der Transformer-Architektur und verwendet Techniken wie die SwiGLU-Aktivierungsfunktion, die Aufmerksamkeits-QKV-Bias (attention QKV bias), die gruppenbasierte Abfrageaufmerksamkeit (group query attention) und eine Mischung aus rutschendem Fenster und voller Aufmerksamkeit (mixture of sliding window attention and full attention). Darüber hinaus hat das Qwen-Team den Tokenizer verbessert, der für die Verarbeitung von natürlicher Sprache und Code optimiert ist."
+  },
+  "qwen2-7b-instruct": {
+    "description": "Qwen2 ist die neueste Serie von großen Sprachmodellen, die vom Qwen-Team entwickelt wurde. Es basiert auf der Transformer-Architektur und verwendet Techniken wie die SwiGLU-Aktivierungsfunktion, die Aufmerksamkeits-QKV-Bias (attention QKV bias), die Gruppenabfrageaufmerksamkeit (group query attention) und eine Mischung aus rutschendem Fenster und voller Aufmerksamkeit (mixture of sliding window attention and full attention). Zudem hat das Qwen-Team den Tokenizer verbessert, um mehrere natürliche Sprachen und Code besser zu verarbeiten."
+  },
  "qwen2.5": {
    "description": "Qwen2.5 ist das neue, groß angelegte Sprachmodell der Alibaba-Gruppe, das hervorragende Leistungen zur Unterstützung vielfältiger Anwendungsbedürfnisse bietet."
  },
@@ -1604,6 +1703,12 @@
  "qwen2.5-coder-7b-instruct": {
    "description": "Die Open-Source-Version des Tongyi Qianwen Code-Modells."
  },
+  "qwen2.5-coder-instruct": {
+    "description": "Qwen2.5-Coder ist das neueste Modell der Qwen-Serie, speziell für den Codeentwicklungsbereich entwickelt (früher bekannt als CodeQwen)."
+  },
+  "qwen2.5-instruct": {
+    "description": "Qwen2.5 ist die neueste Serie des Qwen-Sprachmodells. Für Qwen2.5 haben wir mehrere Basis-Sprachmodelle und instruktionsfeinjustierte Sprachmodelle veröffentlicht, deren Parameter von 500 Millionen bis 7,2 Milliarden reichen."
+  },
  "qwen2.5-math-1.5b-instruct": {
    "description": "Das Qwen-Math-Modell verfügt über starke Fähigkeiten zur Lösung mathematischer Probleme."
  },
@@ -1613,12 +1718,21 @@
  "qwen2.5-math-7b-instruct": {
    "description": "Das Qwen-Math-Modell verfügt über starke Fähigkeiten zur Lösung mathematischer Probleme."
  },
+  "qwen2.5-omni-7b": {
+    "description": "Das Qwen-Omni-Modell der Serie unterstützt die Eingabe verschiedener Modalitäten, einschließlich Video, Audio, Bilder und Text, und gibt Audio und Text aus."
+  },
+  "qwen2.5-vl-32b-instruct": {
+    "description": "Die Qwen2.5-VL-Modellreihe verbessert die Intelligenz, Praktikabilität und Anwendbarkeit des Modells, sodass es in Szenarien wie natürlichen Dialogen, Inhaltserstellung, Fachwissensdiensten und Codeentwicklung besser abschneidet. Die 32B-Version verwendet Techniken des verstärkenden Lernens zur Optimierung des Modells. Im Vergleich zu anderen Modellen der Qwen2.5-VL-Reihe bietet sie einen für Menschen präferierten Ausgabe-Stil, Fähigkeiten zur Inferenz komplexer mathematischer Probleme sowie die Fähigkeit zur feingranularen Bildverarbeitung und -inferenz."
+  },
  "qwen2.5-vl-72b-instruct": {
    "description": "Verbesserte Befolgung von Anweisungen, Mathematik, Problemlösung und Programmierung, gesteigerte Erkennungsfähigkeiten für alle Arten von visuellen Elementen, Unterstützung für die präzise Lokalisierung visueller Elemente in verschiedenen Formaten, Verständnis von langen Videodateien (maximal 10 Minuten) und sekundengenauer Ereigniszeitpunktlokalisierung, Fähigkeit zur zeitlichen Einordnung und Geschwindigkeitsverständnis, Unterstützung für die Steuerung von OS- oder Mobile-Agenten basierend auf Analyse- und Lokalisierungsfähigkeiten, starke Fähigkeit zur Extraktion von Schlüsselinformationen und JSON-Format-Ausgabe. Diese Version ist die leistungsstärkste Version der 72B-Serie."
  },
  "qwen2.5-vl-7b-instruct": {
    "description": "Verbesserte Befolgung von Anweisungen, Mathematik, Problemlösung und Programmierung, gesteigerte Erkennungsfähigkeiten für alle Arten von visuellen Elementen, Unterstützung für die präzise Lokalisierung visueller Elemente in verschiedenen Formaten, Verständnis von langen Videodateien (maximal 10 Minuten) und sekundengenauer Ereigniszeitpunktlokalisierung, Fähigkeit zur zeitlichen Einordnung und Geschwindigkeitsverständnis, Unterstützung für die Steuerung von OS- oder Mobile-Agenten basierend auf Analyse- und Lokalisierungsfähigkeiten, starke Fähigkeit zur Extraktion von Schlüsselinformationen und JSON-Format-Ausgabe. Diese Version ist die leistungsstärkste Version der 72B-Serie."
  },
+  "qwen2.5-vl-instruct": {
+    "description": "Qwen2.5-VL ist die neueste Version des visuellen Sprachmodells in der Qwen-Modellfamilie."
+  },
  "qwen2.5:0.5b": {
    "description": "Qwen2.5 ist das neue, groß angelegte Sprachmodell der Alibaba-Gruppe, das hervorragende Leistungen zur Unterstützung vielfältiger Anwendungsbedürfnisse bietet."
  },
@@ -1754,6 +1868,9 @@
  "wizardlm2:8x22b": {
    "description": "WizardLM 2 ist ein Sprachmodell von Microsoft AI, das in komplexen Dialogen, mehrsprachigen Anwendungen, Schlussfolgerungen und intelligenten Assistenten besonders gut abschneidet."
  },
+  "yi-1.5-34b-chat": {
+    "description": "Yi-1.5 ist eine verbesserte Version von Yi. Es wurde mit einem hochwertigen Korpus von 500B Tokens auf Yi fortlaufend vortrainiert und auf 3M diversen Feinabstimmungsbeispielen feinjustiert."
+  },
  "yi-large": {
    "description": "Das brandneue Modell mit einer Billion Parametern bietet außergewöhnliche Frage- und Textgenerierungsfähigkeiten."
  },
@@ -23,6 +23,9 @@
  "cloudflare": {
    "description": "Führen Sie von serverlosen GPUs betriebene Machine-Learning-Modelle im globalen Netzwerk von Cloudflare aus."
  },
+  "cohere": {
+    "description": "Cohere bringt Ihnen die fortschrittlichsten mehrsprachigen Modelle, leistungsstarke Suchfunktionen und einen maßgeschneiderten KI-Arbeitsbereich für moderne Unternehmen – alles integriert in einer sicheren Plattform."
+  },
  "deepseek": {
    "description": "DeepSeek ist ein Unternehmen, das sich auf die Forschung und Anwendung von KI-Technologien spezialisiert hat. Ihr neuestes Modell, DeepSeek-V2.5, kombiniert allgemeine Dialog- und Codeverarbeitungsfähigkeiten und hat signifikante Fortschritte in den Bereichen menschliche Präferenzanpassung, Schreibaufgaben und Befehlsbefolgung erzielt."
  },
@@ -53,6 +56,9 @@
  "hunyuan": {
    "description": "Ein von Tencent entwickeltes großes Sprachmodell, das über starke Fähigkeiten zur Erstellung von Inhalten in chinesischer Sprache, logisches Denkvermögen in komplexen Kontexten und zuverlässige Fähigkeiten zur Aufgabenerfüllung verfügt."
  },
+  "infiniai": {
+    "description": "Bietet Anwendungsentwicklern hochleistungs-fähige, benutzerfreundliche und sichere Dienste für große Modelle, die den gesamten Prozess von der Entwicklung großer Modelle bis hin zur Dienstbereitstellung abdecken."
+  },
  "internlm": {
    "description": "Eine Open-Source-Organisation, die sich der Forschung und Entwicklung von großen Modellen und Werkzeugketten widmet. Sie bietet allen KI-Entwicklern eine effiziente und benutzerfreundliche Open-Source-Plattform, die den Zugang zu den neuesten Technologien und Algorithmen für große Modelle ermöglicht."
  },
@@ -98,6 +104,9 @@
  "sambanova": {
    "description": "SambaNova Cloud ermöglicht es Entwicklern, die besten Open-Source-Modelle einfach zu nutzen und von der schnellsten Inferenzgeschwindigkeit zu profitieren."
  },
+  "search1api": {
+    "description": "Search1API bietet Zugriff auf die DeepSeek-Modellreihe, die bei Bedarf selbstständig online gehen kann, einschließlich der Standard- und Schnellversion, und unterstützt die Auswahl von Modellen in verschiedenen Parametergrößen."
+  },
  "sensenova": {
    "description": "SenseTime bietet mit der starken Basisunterstützung von SenseTimes großem Gerät effiziente und benutzerfreundliche Full-Stack-Modelldienste."
  },
@@ -137,6 +146,9 @@
  "xai": {
    "description": "xAI ist ein Unternehmen, das sich der Entwicklung von Künstlicher Intelligenz widmet, um menschliche wissenschaftliche Entdeckungen zu beschleunigen. Unsere Mission ist es, unser gemeinsames Verständnis des Universums voranzutreiben."
  },
+  "xinference": {
+    "description": "Xorbits Inference (Xinference) ist eine Open-Source-Plattform zur Vereinfachung der Ausführung und Integration verschiedener KI-Modelle. Mit Xinference können Sie beliebige Open-Source-LLMs, Embedding-Modelle und multimodale Modelle in der Cloud oder lokal ausführen, um leistungsstarke KI-Anwendungen zu erstellen."
+  },
  "zeroone": {
    "description": "01.AI konzentriert sich auf die künstliche Intelligenz-Technologie der AI 2.0-Ära und fördert aktiv die Innovation und Anwendung von 'Mensch + künstliche Intelligenz', indem sie leistungsstarke Modelle und fortschrittliche KI-Technologien einsetzt, um die Produktivität der Menschen zu steigern und technologische Befähigung zu erreichen."
  },
@@ -42,6 +42,17 @@
    "sessionWithName": "Sitzungseinstellungen · {{name}}",
    "title": "Einstellungen"
  },
+  "hotkey": {
+    "conflicts": "Konflikte mit bestehenden Tastenkombinationen",
+    "group": {
+      "conversation": "Gespräch",
+      "essential": "Grundlegend"
+    },
+    "invalidCombination": "Die Tastenkombination muss mindestens einen Modifikatortaste (Strg, Alt, Umschalt) und eine normale Taste enthalten",
+    "record": "Drücken Sie eine Taste, um die Tastenkombination aufzuzeichnen",
+    "reset": "Auf die Standard-Tastenkombination zurücksetzen",
+    "title": "Tastenkombinationen"
+  },
  "llm": {
    "aesGcm": "Ihr Schlüssel und Ihre Proxy-Adresse werden mit dem <1>AES-GCM</1> Verschlüsselungsalgorithmus verschlüsselt.",
    "apiKey": {
@@ -335,6 +346,33 @@
    },
    "title": "Thema einstellen"
  },
+  "storage": {
+    "actions": {
+      "export": {
+        "button": "Exportieren",
+        "exportType": {
+          "agent": "Exportiere Assistenteneinstellungen",
+          "agentWithMessage": "Exportiere Assistenten und Nachrichten",
+          "all": "Exportiere globale Einstellungen und alle Assistentendaten",
+          "allAgent": "Exportiere alle Assistenteneinstellungen",
+          "allAgentWithMessage": "Exportiere alle Assistenten und Nachrichten",
+          "globalSetting": "Exportiere globale Einstellungen"
+        },
+        "title": "Daten exportieren"
+      },
+      "import": {
+        "button": "Importieren",
+        "title": "Daten importieren"
+      },
+      "title": "Erweiterte Aktionen"
+    },
+    "desc": "Speicherverbrauch im aktuellen Browser",
+    "embeddings": {
+      "used": "Vektorspeicher"
+    },
+    "title": "Datenspeicher",
+    "used": "Speicherverbrauch"
+  },
  "submitAgentModal": {
    "button": "Assistent einreichen",
    "identifier": "Assistenten-Kennung",
@@ -425,8 +463,10 @@
    "agent": "Standard-Assistent",
    "common": "Allgemeine Einstellungen",
    "experiment": "Experiment",
+    "hotkey": "Tastenkombinationen",
    "llm": "Sprachmodell",
    "provider": "KI-Dienstanbieter",
+    "storage": "Datenspeicher",
    "sync": "Cloud-Synchronisierung",
    "system-agent": "Systemassistent",
    "tts": "Sprachdienste"
@@ -32,6 +32,7 @@
    "title": "Themenliste"
  },
  "searchPlaceholder": "Themen suchen...",
+  "searchResultEmpty": "Keine Suchergebnisse vorhanden",
  "temp": "Vorübergehend",
  "title": "Thema"
 }
@@ -64,6 +64,9 @@
    "stop": "Stop",
    "warp": "New Line"
  },
+  "intentUnderstanding": {
+    "title": "Understanding and analyzing your intent..."
+  },
  "knowledgeBase": {
    "all": "All Content",
    "allFiles": "All Files",
@@ -144,7 +147,6 @@
        "desc": "Intelligently determine whether a search is needed based on the conversation content",
        "title": "Smart Online Search"
      },
-      "disable": "The current model does not support function calls, so the smart online search feature is unavailable",
      "off": {
        "desc": "Use only the model's basic knowledge without performing a web search",
        "title": "Disable Online Search"
@@ -155,6 +157,10 @@
      },
      "useModelBuiltin": "Use the model's built-in search engine"
    },
+    "searchModel": {
+      "desc": "The current model does not support function calls, so it needs to be paired with a model that does support function calls for online searching.",
+      "title": "Search Assistant Model"
+    },
    "title": "Online Search"
  },
  "searchAgentPlaceholder": "Search assistants...",
@@ -41,7 +41,10 @@
    "error": {
      "desc": "We apologize, an error occurred during the Pglite database initialization process. Please click the button to retry. If the error persists after multiple attempts, please <1>submit an issue</1>, and we will assist you as soon as possible.",
      "detail": "Error reason: [{{type}}] {{message}}. Details are as follows:",
+      "detailTitle": "Error Reason",
+      "report": "Report Issue",
      "retry": "Retry",
+      "selfSolve": "Self-Solve",
      "title": "Database Initialization Failed"
    },
    "initing": {
@@ -80,6 +83,54 @@
      "button": "Use Now",
      "desc": "Ready to use",
      "title": "PGlite Database is Ready"
+    },
+    "solve": {
+      "backup": {
+        "backup": "Backup",
+        "backupSuccess": "Backup Successful",
+        "desc": "Export key data from the current database",
+        "export": "Export All Data",
+        "exportDesc": "The exported data will be saved in JSON format, which can be used for future recovery or analysis.",
+        "reset": {
+          "alert": "Warning",
+          "alertDesc": "The following actions may result in data loss. Please ensure you have backed up important data before proceeding.",
+          "button": "Completely Reset Database (Delete All Data)",
+          "confirm": {
+            "desc": "This action will delete all data and cannot be undone. Do you confirm to continue?",
+            "title": "Confirm Database Reset"
+          },
+          "desc": "Reset the database in case of irreversible migration",
+          "title": "Database Reset"
+        },
+        "restore": "Restore",
+        "restoreSuccess": "Restore Successful",
+        "title": "Data Backup"
+      },
+      "diagnosis": {
+        "createdAt": "Creation Time",
+        "migratedAt": "Migration Completion Time",
+        "sql": "Migration SQL",
+        "title": "Migration Status"
+      },
+      "repair": {
+        "desc": "Manually manage migration status",
+        "runSQL": "Custom Execute",
+        "sql": {
+          "clear": "Clear",
+          "desc": "Execute custom SQL statements to fix database issues",
+          "markFinished": "Mark as Finished",
+          "placeholder": "Enter SQL statement...",
+          "result": "Execution Result",
+          "run": "Execute",
+          "title": "SQL Executor"
+        },
+        "title": "Migration Control"
+      },
+      "tabs": {
+        "backup": "Backup & Restore",
+        "diagnosis": "Diagnosis",
+        "repair": "Repair"
+      }
    }
  },
  "close": "Close",
@@ -132,7 +183,7 @@
  },
  "fullscreen": "Full Screen Mode",
  "historyRange": "History Range",
-  "import": "Import Configuration",
+  "importData": "Import Data",
  "importModal": {
    "error": {
      "desc": "Sorry, an error occurred during the data import process. Please try importing again, or <1>submit a request</1>, and we will help you troubleshoot the issue as soon as possible.",
@@ -154,7 +205,8 @@
      "sessions": "Assistants",
      "skips": "Duplicates skipped",
      "topics": "Topics",
-      "type": "Data Type"
+      "type": "Data Type",
+      "update": "Record Updated"
    },
    "title": "Import Data",
    "uploading": {
@@ -163,6 +215,16 @@
      "speed": "Upload speed"
    }
  },
+  "importPreview": {
+    "confirmImport": "Confirm Import",
+    "tables": {
+      "count": "Record Count",
+      "name": "Table Name"
+    },
+    "title": "Data Import Preview",
+    "totalRecords": "A total of {{count}} records will be imported",
+    "totalTables": "{{count}} tables"
+  },
  "information": "Community and News",
  "installPWA": "Install browser app",
  "lang": {
@@ -76,6 +76,7 @@
      "custom": "Custom model, by default, supports both function call and visual recognition. Please verify the availability of the above capabilities based on actual situations.",
      "file": "This model supports file upload for reading and recognition.",
      "functionCall": "This model supports function call.",
+      "imageOutput": "This model supports image generation",
      "reasoning": "This model supports deep thinking",
      "search": "This model supports online search",
      "tokens": "This model supports up to {{tokens}} tokens in a single session.",
@@ -85,6 +86,8 @@
  },
  "ModelSwitchPanel": {
    "emptyModel": "No enabled model. Please go to settings to enable.",
+    "emptyProvider": "No enabled providers. Please go to settings to enable one.",
+    "goToSettings": "Go to settings",
    "provider": "Provider"
  },
  "OllamaSetupGuide": {
@@ -16,6 +16,16 @@
    "detail": "Error details",
    "title": "Request failed"
  },
+  "import": {
+    "importConfigFile": {
+      "description": "Error reason: {{reason}}",
+      "title": "Import Failed"
+    },
+    "incompatible": {
+      "description": "This file was exported from a higher version. Please try upgrading to the latest version and then re-importing.",
+      "title": "Current application does not support importing this file"
+    }
+  },
  "loginRequired": {
    "desc": "You will be redirected to the login page shortly",
    "title": "Please log in to use this feature"
@@ -69,6 +79,7 @@
    "524": "Sorry, the server timed out while waiting for a response, possibly due to a slow reply. Please try again later.",
    "AgentRuntimeError": "Lobe language model runtime execution error. Please troubleshoot or retry based on the following information.",
    "ConnectionCheckFailed": "The request returned empty. Please check if the API proxy address does not end with `/v1`.",
+    "CreateMessageError": "Sorry, the message could not be sent successfully. Please copy the content and try sending it again. This message will not be retained after refreshing the page.",
    "ExceededContextWindow": "The current request content exceeds the length that the model can handle. Please reduce the amount of content and try again.",
    "FreePlanLimit": "You are currently a free user and cannot use this feature. Please upgrade to a paid plan to continue using it.",
    "InsufficientQuota": "Sorry, the quota for this key has been reached. Please check your account balance or increase the key quota and try again.",
@@ -0,0 +1,46 @@
+{
+  "addUserMessage": {
+    "desc": "Add the current input as a user message without triggering generation",
+    "title": "Add a User Message"
+  },
+  "editMessage": {
+    "desc": "Enter edit mode by holding Alt and double-clicking the message",
+    "title": "Edit Message"
+  },
+  "openChatSettings": {
+    "desc": "View and modify the settings for the current conversation",
+    "title": "Open Chat Settings"
+  },
+  "openHotkeyHelper": {
+    "desc": "View instructions for all keyboard shortcuts",
+    "title": "Open Hotkey Help"
+  },
+  "regenerateMessage": {
+    "desc": "Regenerate the last message",
+    "title": "Regenerate Message"
+  },
+  "saveTopic": {
+    "desc": "Save the current topic and open a new one",
+    "title": "Start a New Topic"
+  },
+  "search": {
+    "desc": "Activate the main search box on the current page",
+    "title": "Search"
+  },
+  "switchAgent": {
+    "desc": "Switch between pinned assistants in the sidebar by holding Ctrl and pressing numbers 0-9",
+    "title": "Quick Switch Assistant"
+  },
+  "toggleLeftPanel": {
+    "desc": "Show or hide the left assistant panel",
+    "title": "Show/Hide Assistant Panel"
+  },
+  "toggleRightPanel": {
+    "desc": "Show or hide the right topics panel",
+    "title": "Show/Hide Topic Panel"
+  },
+  "toggleZenMode": {
+    "desc": "In focus mode, only display the current conversation and hide other UI elements",
+    "title": "Toggle Focus Mode"
+  }
+}
@@ -1,13 +1,4 @@
 {
-  "01-ai/Yi-1.5-34B-Chat-16K": {
-    "description": "Yi-1.5 34B delivers superior performance in industry applications with a wealth of training samples."
-  },
-  "01-ai/Yi-1.5-6B-Chat": {
-    "description": "Yi-1.5-6B-Chat is a variant of the Yi-1.5 series, belonging to the open-source chat model. Yi-1.5 is an upgraded version of Yi, continuously pre-trained on 500B high-quality corpora and fine-tuned on over 3M diverse samples. Compared to Yi, Yi-1.5 demonstrates stronger capabilities in coding, mathematics, reasoning, and instruction following, while maintaining excellent language understanding, common sense reasoning, and reading comprehension abilities. The model is available in context length versions of 4K, 16K, and 32K, with a total pre-training volume reaching 3.6T tokens."
-  },
-  "01-ai/Yi-1.5-9B-Chat-16K": {
-    "description": "Yi-1.5 9B supports 16K tokens, providing efficient and smooth language generation capabilities."
-  },
  "01-ai/yi-1.5-34b-chat": {
    "description": "Zero One Everything, the latest open-source fine-tuned model with 34 billion parameters, supports various dialogue scenarios with high-quality training data aligned with human preferences."
  },
@@ -149,12 +140,6 @@
  "Llama-3.2-90B-Vision-Instruct\t": {
    "description": "Advanced image reasoning capabilities suitable for visual understanding agent applications."
  },
-  "LoRA/Qwen/Qwen2.5-72B-Instruct": {
-    "description": "Qwen2.5-72B-Instruct is one of the latest large language models released by Alibaba Cloud. This 72B model shows significant improvements in coding and mathematics. It also provides multilingual support, covering over 29 languages, including Chinese and English. The model has made notable advancements in instruction following, understanding structured data, and generating structured outputs, especially JSON."
-  },
-  "LoRA/Qwen/Qwen2.5-7B-Instruct": {
-    "description": "Qwen2.5-7B-Instruct is one of the latest large language models released by Alibaba Cloud. This 7B model shows significant improvements in coding and mathematics. It also provides multilingual support, covering over 29 languages, including Chinese and English. The model has made notable advancements in instruction following, understanding structured data, and generating structured outputs, especially JSON."
-  },
  "Meta-Llama-3.1-405B-Instruct": {
    "description": "Llama 3.1 instruction-tuned text model optimized for multilingual dialogue use cases, performing excellently on common industry benchmarks among many available open-source and closed chat models."
  },
@@ -179,9 +164,6 @@
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": {
    "description": "Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) is a high-precision instruction model suitable for complex computations."
  },
-  "OpenGVLab/InternVL2-26B": {
-    "description": "InternVL2 demonstrates exceptional performance across various visual language tasks, including document and chart understanding, scene text understanding, OCR, and solving scientific and mathematical problems."
-  },
  "Phi-3-medium-128k-instruct": {
    "description": "The same Phi-3-medium model, but with a larger context size for RAG or few-shot prompting."
  },
@@ -206,9 +188,6 @@
  "Phi-3.5-vision-instrust": {
    "description": "An updated version of the Phi-3-vision model."
  },
-  "Pro/OpenGVLab/InternVL2-8B": {
-    "description": "InternVL2 demonstrates exceptional performance across various visual language tasks, including document and chart understanding, scene text understanding, OCR, and solving scientific and mathematical problems."
-  },
  "Pro/Qwen/Qwen2-1.5B-Instruct": {
    "description": "Qwen2-1.5B-Instruct is an instruction-tuned large language model in the Qwen2 series, with a parameter size of 1.5B. This model is based on the Transformer architecture and employs techniques such as the SwiGLU activation function, attention QKV bias, and group query attention. It excels in language understanding, generation, multilingual capabilities, coding, mathematics, and reasoning across multiple benchmark tests, surpassing most open-source models. Compared to Qwen1.5-1.8B-Chat, Qwen2-1.5B-Instruct shows significant performance improvements in tests such as MMLU, HumanEval, GSM8K, C-Eval, and IFEval, despite having slightly fewer parameters."
  },
@@ -224,20 +203,26 @@
  "Pro/Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct is the latest version in Alibaba Cloud's series of code-specific large language models. This model significantly enhances code generation, reasoning, and repair capabilities based on Qwen2.5, trained on 55 trillion tokens. It not only improves coding abilities but also maintains advantages in mathematics and general capabilities, providing a more comprehensive foundation for practical applications such as code agents."
  },
+  "Pro/Qwen/Qwen2.5-VL-7B-Instruct": {
+    "description": "Qwen2.5-VL is the newest addition to the Qwen series, featuring enhanced visual comprehension capabilities. It can analyze text, charts, and layouts within images, comprehend long videos while capturing events. The model supports reasoning, tool manipulation, multi-format object localization, and structured output generation. It incorporates optimized dynamic resolution and frame rate training for video understanding, along with improved efficiency in its visual encoder."
+  },
  "Pro/THUDM/glm-4-9b-chat": {
    "description": "GLM-4-9B-Chat is the open-source version of the GLM-4 series pre-trained models launched by Zhipu AI. This model excels in semantics, mathematics, reasoning, code, and knowledge. In addition to supporting multi-turn dialogues, GLM-4-9B-Chat also features advanced capabilities such as web browsing, code execution, custom tool invocation (Function Call), and long-text reasoning. The model supports 26 languages, including Chinese, English, Japanese, Korean, and German. In multiple benchmark tests, GLM-4-9B-Chat has demonstrated excellent performance, such as in AlignBench-v2, MT-Bench, MMLU, and C-Eval. The model supports a maximum context length of 128K, making it suitable for academic research and commercial applications."
  },
  "Pro/deepseek-ai/DeepSeek-R1": {
    "description": "DeepSeek-R1 is a reinforcement learning (RL) driven inference model that addresses issues of repetitiveness and readability in models. Prior to RL, DeepSeek-R1 introduced cold start data to further optimize inference performance. It performs comparably to OpenAI-o1 in mathematical, coding, and reasoning tasks, and enhances overall effectiveness through carefully designed training methods."
  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+    "description": "DeepSeek-R1-Distill-Qwen-1.5B is a model derived from Qwen2.5-Math-1.5B through knowledge distillation. Fine-tuned with 800,000 carefully selected samples generated by DeepSeek-R1, this model demonstrates commendable performance across multiple benchmarks. As a lightweight model, it achieves an accuracy of 83.9% on MATH-500, a pass rate of 28.9% on AIME 2024, and a score of 954 on CodeForces, showcasing reasoning capabilities that exceed its parameter scale."
+  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+    "description": "DeepSeek-R1-Distill-Qwen-7B is a model derived from Qwen2.5-Math-7B through knowledge distillation. It was fine-tuned using 800,000 carefully selected samples generated by DeepSeek-R1, demonstrating exceptional reasoning capabilities. The model achieves outstanding performance across multiple benchmarks, including 92.8% accuracy on MATH-500, a 55.5% pass rate on AIME 2024, and a score of 1189 on CodeForces, showcasing strong mathematical and programming abilities for a 7B-scale model."
+  },
  "Pro/deepseek-ai/DeepSeek-V3": {
    "description": "DeepSeek-V3 is a mixed expert (MoE) language model with 671 billion parameters, utilizing multi-head latent attention (MLA) and the DeepSeekMoE architecture, combined with a load balancing strategy without auxiliary loss to optimize inference and training efficiency. Pre-trained on 14.8 trillion high-quality tokens and fine-tuned with supervision and reinforcement learning, DeepSeek-V3 outperforms other open-source models and approaches leading closed-source models."
  },
-  "Pro/google/gemma-2-9b-it": {
-    "description": "Gemma is one of Google's lightweight, state-of-the-art open model series. It is a large language model with a decoder-only architecture, supporting English, and providing open weights, pre-trained variants, and instruction-tuned variants. The Gemma model is suitable for various text generation tasks, including question answering, summarization, and reasoning. This 9B model is trained on 80 trillion tokens. Its relatively small size allows it to be deployed in resource-constrained environments, such as laptops, desktops, or your own cloud infrastructure, making cutting-edge AI models more accessible and fostering innovation."
-  },
-  "Pro/meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "Meta Llama 3.1 is a family of multilingual large language models developed by Meta, including pre-trained and instruction-tuned variants with parameter sizes of 8B, 70B, and 405B. This 8B instruction-tuned model is optimized for multilingual dialogue scenarios and performs excellently in multiple industry benchmark tests. The model is trained using over 150 trillion tokens of public data and employs techniques such as supervised fine-tuning and human feedback reinforcement learning to enhance the model's usefulness and safety. Llama 3.1 supports text generation and code generation, with a knowledge cutoff date of December 2023."
+  "Pro/deepseek-ai/DeepSeek-V3-1226": {
+    "description": "DeepSeek-V3 is a mixture of experts (MoE) language model with 671 billion parameters, utilizing multi-head latent attention (MLA) and the DeepSeekMoE architecture, combined with a load balancing strategy without auxiliary loss to optimize inference and training efficiency. Pre-trained on 14.8 trillion high-quality tokens and fine-tuned with supervised learning and reinforcement learning, DeepSeek-V3 outperforms other open-source models and approaches leading closed-source models in performance."
  },
  "QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview is an innovative natural language processing model capable of efficiently handling complex dialogue generation and context understanding tasks."
@@ -290,6 +275,12 @@
  "Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct is the latest version in Alibaba Cloud's series of code-specific large language models. This model significantly enhances code generation, reasoning, and repair capabilities based on Qwen2.5, trained on 55 trillion tokens. It not only improves coding abilities but also maintains advantages in mathematics and general capabilities, providing a more comprehensive foundation for practical applications such as code agents."
  },
+  "Qwen/Qwen2.5-VL-32B-Instruct": {
+    "description": "Qwen2.5-VL-32B-Instruct is a multimodal large language model developed by the Tongyi Qianwen team, representing part of the Qwen2.5-VL series. This model excels not only in recognizing common objects but also in analyzing text, charts, icons, graphics, and layouts within images. It functions as a visual agent capable of reasoning and dynamically manipulating tools, with the ability to operate computers and mobile devices. Additionally, the model can precisely locate objects in images and generate structured outputs for documents like invoices and tables. Compared to its predecessor Qwen2-VL, this version demonstrates enhanced mathematical and problem-solving capabilities through reinforcement learning, while also exhibiting more human-preferred response styles."
+  },
+  "Qwen/Qwen2.5-VL-72B-Instruct": {
+    "description": "Qwen2.5-VL is the vision-language model in the Qwen2.5 series. This model demonstrates significant improvements across multiple dimensions: enhanced visual comprehension capable of recognizing common objects, analyzing text, charts, and layouts; serving as a visual agent that can reason and dynamically guide tool usage; supporting understanding of long videos exceeding 1 hour while capturing key events; able to precisely locate objects in images by generating bounding boxes or points; and capable of producing structured outputs particularly suitable for scanned data like invoices and forms."
+  },
  "Qwen2-72B-Instruct": {
    "description": "Qwen2 is the latest series of the Qwen model, supporting 128k context. Compared to the current best open-source models, Qwen2-72B significantly surpasses leading models in natural language understanding, knowledge, coding, mathematics, and multilingual capabilities."
  },
@@ -374,9 +365,6 @@
  "TeleAI/TeleChat2": {
    "description": "The TeleChat2 large model is a generative semantic model independently developed from scratch by China Telecom, supporting functions such as encyclopedia Q&A, code generation, and long text generation, providing users with conversational consulting services. It can interact with users, answer questions, assist in creation, and efficiently help users obtain information, knowledge, and inspiration. The model performs well in areas such as hallucination issues, long text generation, and logical understanding."
  },
-  "TeleAI/TeleMM": {
-    "description": "The TeleMM multimodal large model is a multimodal understanding model independently developed by China Telecom, capable of processing various modal inputs such as text and images, supporting functions like image understanding and chart analysis, providing users with cross-modal understanding services. The model can interact with users in a multimodal manner, accurately understand input content, answer questions, assist in creation, and efficiently provide multimodal information and inspiration support. It excels in fine-grained perception, logical reasoning, and other multimodal tasks."
-  },
  "Vendor-A/Qwen/Qwen2.5-72B-Instruct": {
    "description": "Qwen2.5-72B-Instruct is one of the latest large language models released by Alibaba Cloud. This 72B model shows significant improvements in coding and mathematics. It also provides multilingual support, covering over 29 languages, including Chinese and English. The model has made notable advancements in instruction following, understanding structured data, and generating structured outputs, especially JSON."
  },
@@ -506,6 +494,9 @@
  "anthropic/claude-3.5-sonnet": {
    "description": "Claude 3.5 Sonnet offers capabilities that surpass Opus and faster speeds than Sonnet, while maintaining the same pricing as Sonnet. Sonnet excels particularly in programming, data science, visual processing, and agent tasks."
  },
+  "anthropic/claude-3.7-sonnet": {
+    "description": "Claude 3.7 Sonnet is Anthropic's most advanced model to date and the first hybrid reasoning model on the market. Claude 3.7 Sonnet can generate near-instant responses or extended step-by-step reasoning, allowing users to clearly observe these processes. Sonnet excels particularly in programming, data science, visual processing, and agent tasks."
+  },
  "aya": {
    "description": "Aya 23 is a multilingual model launched by Cohere, supporting 23 languages, facilitating diverse language applications."
  },
@@ -515,9 +506,27 @@
  "baichuan/baichuan2-13b-chat": {
    "description": "Baichuan-13B is an open-source, commercially usable large language model developed by Baichuan Intelligence, containing 13 billion parameters, achieving the best results in its size on authoritative Chinese and English benchmarks."
  },
+  "c4ai-aya-expanse-32b": {
+    "description": "Aya Expanse is a high-performance 32B multilingual model designed to challenge the performance of single-language models through innovations in instruction tuning, data arbitrage, preference training, and model merging. It supports 23 languages."
+  },
+  "c4ai-aya-expanse-8b": {
+    "description": "Aya Expanse is a high-performance 8B multilingual model designed to challenge the performance of single-language models through innovations in instruction tuning, data arbitrage, preference training, and model merging. It supports 23 languages."
+  },
+  "c4ai-aya-vision-32b": {
+    "description": "Aya Vision is a state-of-the-art multimodal model that excels in multiple key benchmarks for language, text, and image capabilities. This 32 billion parameter version focuses on cutting-edge multilingual performance and supports 23 languages."
+  },
+  "c4ai-aya-vision-8b": {
+    "description": "Aya Vision is a state-of-the-art multimodal model that excels in multiple key benchmarks for language, text, and image capabilities. This 8 billion parameter version focuses on low latency and optimal performance."
+  },
  "charglm-3": {
    "description": "CharGLM-3 is designed for role-playing and emotional companionship, supporting ultra-long multi-turn memory and personalized dialogue, with wide applications."
  },
+  "chatglm3": {
+    "description": "ChatGLM3 is a closed-source model released by Zhipu AI and Tsinghua KEG Lab. It has been pre-trained on a massive amount of Chinese and English identifiers and fine-tuned with human preference alignment. Compared to the first-generation model, it has achieved improvements of 16%, 36%, and 280% in MMLU, C-Eval, and GSM8K, respectively, and topped the Chinese task leaderboard C-Eval. It is suitable for scenarios that require a high level of knowledge, reasoning, and creativity, such as advertising copywriting, novel writing, knowledge-based writing, and code generation."
+  },
+  "chatglm3-6b-base": {
+    "description": "ChatGLM3-6b-base is the latest generation of the ChatGLM series, a 6 billion parameter open-source base model developed by Zhipu."
+  },
  "chatgpt-4o-latest": {
    "description": "ChatGPT-4o is a dynamic model that updates in real-time to stay current with the latest version. It combines powerful language understanding and generation capabilities, making it suitable for large-scale applications, including customer service, education, and technical support."
  },
@@ -593,12 +602,39 @@
  "cohere-command-r-plus": {
    "description": "Command R+ is a state-of-the-art RAG-optimized model designed to tackle enterprise-grade workloads."
  },
+  "command": {
+    "description": "An instruction-following dialogue model that delivers high quality and reliability in language tasks, with a longer context length compared to our base generation models."
+  },
+  "command-a-03-2025": {
+    "description": "Command A is our most powerful model to date, excelling in tool usage, agent tasks, retrieval-augmented generation (RAG), and multilingual applications. Command A features a context length of 256K and can run on just two GPUs, achieving a 150% increase in throughput compared to Command R+ 08-2024."
+  },
+  "command-light": {
+    "description": "A smaller, faster version of Command that is nearly as powerful but operates at a higher speed."
+  },
+  "command-light-nightly": {
+    "description": "To shorten the time interval between major version releases, we have launched nightly versions of the Command model. For the command-light series, this version is called command-light-nightly. Please note that command-light-nightly is the latest, most experimental, and (potentially) unstable version. Nightly versions are updated regularly without prior notice, so they are not recommended for production use."
+  },
+  "command-nightly": {
+    "description": "To shorten the time interval between major version releases, we have launched nightly versions of the Command model. For the Command series, this version is called command-cightly. Please note that command-nightly is the latest, most experimental, and (potentially) unstable version. Nightly versions are updated regularly without prior notice, so they are not recommended for production use."
+  },
  "command-r": {
    "description": "Command R is an LLM optimized for dialogue and long context tasks, particularly suitable for dynamic interactions and knowledge management."
  },
+  "command-r-03-2024": {
+    "description": "Command R is an instruction-following dialogue model that provides higher quality and reliability in language tasks, with a longer context length than previous models. It can be used for complex workflows such as code generation, retrieval-augmented generation (RAG), tool usage, and agent tasks."
+  },
+  "command-r-08-2024": {
+    "description": "command-r-08-2024 is an updated version of the Command R model, released in August 2024."
+  },
  "command-r-plus": {
    "description": "Command R+ is a high-performance large language model designed for real enterprise scenarios and complex applications."
  },
+  "command-r-plus-04-2024": {
+    "description": "Command R+ is an instruction-following dialogue model that delivers higher quality and reliability in language tasks, with a longer context length than previous models. It is best suited for complex RAG workflows and multi-step tool usage."
+  },
+  "command-r7b-12-2024": {
+    "description": "command-r7b-12-2024 is a compact and efficient updated version, released in December 2024. It excels in tasks requiring complex reasoning and multi-step processing, such as RAG, tool usage, and agent tasks."
+  },
  "dall-e-2": {
    "description": "The second generation DALL·E model, supporting more realistic and accurate image generation, with a resolution four times that of the first generation."
  },
@@ -614,9 +650,6 @@
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": {
    "description": "The DeepSeek-R1 distillation model optimizes inference performance through reinforcement learning and cold-start data, refreshing the benchmark for open-source models across multiple tasks."
  },
-  "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
-    "description": "DeepSeek-R1-Distill-Llama-8B is a distillation model developed based on Llama-3.1-8B. This model is fine-tuned using samples generated by DeepSeek-R1, demonstrating excellent reasoning capabilities. It has performed well in multiple benchmark tests, achieving an 89.1% accuracy rate on MATH-500, a 50.4% pass rate on AIME 2024, and a score of 1205 on CodeForces, showcasing strong mathematical and programming abilities as an 8B scale model."
-  },
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
    "description": "The DeepSeek-R1 distillation model optimizes inference performance through reinforcement learning and cold-start data, refreshing the benchmark for open-source models across multiple tasks."
  },
@@ -659,12 +692,30 @@
  "deepseek-r1": {
    "description": "DeepSeek-R1 is a reinforcement learning (RL) driven inference model that addresses issues of repetitiveness and readability within the model. Prior to RL, DeepSeek-R1 introduced cold start data to further optimize inference performance. It performs comparably to OpenAI-o1 in mathematical, coding, and reasoning tasks, and enhances overall effectiveness through meticulously designed training methods."
  },
+  "deepseek-r1-70b-fast-online": {
+    "description": "DeepSeek R1 70B fast version, supporting real-time online search, providing faster response times while maintaining model performance."
+  },
+  "deepseek-r1-70b-online": {
+    "description": "DeepSeek R1 70B standard version, supporting real-time online search, suitable for dialogue and text processing tasks that require the latest information."
+  },
+  "deepseek-r1-distill-llama": {
+    "description": "deepseek-r1-distill-llama is a model distilled from DeepSeek-R1 based on Llama."
+  },
  "deepseek-r1-distill-llama-70b": {
    "description": "DeepSeek R1—the larger and smarter model in the DeepSeek suite—has been distilled into the Llama 70B architecture. Based on benchmark tests and human evaluations, this model is smarter than the original Llama 70B, especially excelling in tasks requiring mathematical and factual accuracy."
  },
  "deepseek-r1-distill-llama-8b": {
    "description": "The DeepSeek-R1-Distill series models are fine-tuned versions of samples generated by DeepSeek-R1, using knowledge distillation techniques on open-source models like Qwen and Llama."
  },
+  "deepseek-r1-distill-qianfan-llama-70b": {
+    "description": "First released on February 14, 2025, distilled by the Qianfan model development team using Llama3_70B as the base model (Built with Meta Llama), with Qianfan's corpus also added to the distilled data."
+  },
+  "deepseek-r1-distill-qianfan-llama-8b": {
+    "description": "First released on February 14, 2025, distilled by the Qianfan model development team using Llama3_8B as the base model (Built with Meta Llama), with Qianfan's corpus also added to the distilled data."
+  },
+  "deepseek-r1-distill-qwen": {
+    "description": "deepseek-r1-distill-qwen is a model distilled from DeepSeek-R1 based on Qwen."
+  },
  "deepseek-r1-distill-qwen-1.5b": {
    "description": "The DeepSeek-R1-Distill series models are fine-tuned versions of samples generated by DeepSeek-R1, using knowledge distillation techniques on open-source models like Qwen and Llama."
  },
@@ -677,6 +728,12 @@
  "deepseek-r1-distill-qwen-7b": {
    "description": "The DeepSeek-R1-Distill series models are fine-tuned versions of samples generated by DeepSeek-R1, using knowledge distillation techniques on open-source models like Qwen and Llama."
  },
+  "deepseek-r1-fast-online": {
+    "description": "DeepSeek R1 full fast version, supporting real-time online search, combining the powerful capabilities of 671B parameters with faster response times."
+  },
+  "deepseek-r1-online": {
+    "description": "DeepSeek R1 full version, with 671B parameters, supporting real-time online search, offering enhanced understanding and generation capabilities."
+  },
  "deepseek-reasoner": {
    "description": "The reasoning model launched by DeepSeek. Before outputting the final answer, the model first provides a chain of thought to enhance the accuracy of the final response."
  },
@@ -689,6 +746,9 @@
  "deepseek-v3": {
    "description": "DeepSeek-V3 is a MoE model developed by Hangzhou DeepSeek Artificial Intelligence Technology Research Co., Ltd., achieving outstanding results in multiple evaluations and ranking first among open-source models on mainstream leaderboards. Compared to the V2.5 model, V3 has achieved a threefold increase in generation speed, providing users with a faster and smoother experience."
  },
+  "deepseek-v3-0324": {
+    "description": "DeepSeek-V3-0324 is a 671B parameter MoE model, excelling in programming and technical capabilities, contextual understanding, and long text processing."
+  },
  "deepseek/deepseek-chat": {
    "description": "A new open-source model that integrates general and coding capabilities, retaining the general conversational abilities of the original Chat model and the powerful code handling capabilities of the Coder model, while better aligning with human preferences. Additionally, DeepSeek-V2.5 has achieved significant improvements in writing tasks, instruction following, and more."
  },
@@ -755,6 +815,9 @@
  "ernie-4.0-turbo-8k-preview": {
    "description": "Baidu's flagship ultra-large-scale language model, demonstrating outstanding overall performance, widely applicable to complex task scenarios across various fields; it supports automatic integration with Baidu search plugins to ensure the timeliness of Q&A information. It performs better than ERNIE 4.0 in terms of performance."
  },
+  "ernie-4.5-8k-preview": {
+    "description": "ERNIE 4.5 is Baidu's self-developed next-generation native multimodal foundational model, achieving collaborative optimization through joint modeling of multiple modalities, with excellent multimodal understanding capabilities; it features enhanced language abilities, with significant improvements in understanding, generation, logic, and memory, as well as reduced hallucinations and improved logical reasoning and coding capabilities."
+  },
  "ernie-char-8k": {
    "description": "Baidu's vertical scene large language model, suitable for applications such as game NPCs, customer service dialogues, and role-playing conversations, with a more distinct and consistent character style, stronger instruction-following capabilities, and superior inference performance."
  },
@@ -788,9 +851,6 @@
  "gemini-1.0-pro-latest": {
    "description": "Gemini 1.0 Pro is Google's high-performance AI model, designed for extensive task scaling."
  },
-  "gemini-1.5-flash": {
-    "description": "Gemini 1.5 Flash is Google's latest multimodal AI model, featuring rapid processing capabilities and supporting text, image, and video inputs, making it efficient for scaling across various tasks."
-  },
  "gemini-1.5-flash-001": {
    "description": "Gemini 1.5 Flash 001 is an efficient multimodal model that supports extensive application scaling."
  },
@@ -803,6 +863,9 @@
  "gemini-1.5-flash-8b-exp-0924": {
    "description": "Gemini 1.5 Flash 8B 0924 is the latest experimental model, showcasing significant performance improvements in both text and multimodal use cases."
  },
+  "gemini-1.5-flash-8b-latest": {
+    "description": "Gemini 1.5 Flash 8B is a highly efficient multimodal model designed for scalable applications."
+  },
  "gemini-1.5-flash-exp-0827": {
    "description": "Gemini 1.5 Flash 0827 provides optimized multimodal processing capabilities, suitable for various complex task scenarios."
  },
@@ -830,24 +893,27 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash offers next-generation features and improvements, including exceptional speed, native tool usage, multimodal generation, and a 1M token context window."
  },
+  "gemini-2.0-flash-exp": {
+    "description": "Gemini 2.0 Flash model variant optimized for cost-effectiveness and low latency."
+  },
+  "gemini-2.0-flash-exp-image-generation": {
+    "description": "Gemini 2.0 Flash experimental model, supports image generation"
+  },
  "gemini-2.0-flash-lite": {
    "description": "Gemini 2.0 Flash is a variant of the model optimized for cost-effectiveness and low latency."
  },
  "gemini-2.0-flash-lite-001": {
    "description": "Gemini 2.0 Flash is a variant of the model optimized for cost-effectiveness and low latency."
  },
-  "gemini-2.0-flash-lite-preview-02-05": {
-    "description": "A Gemini 2.0 Flash model optimized for cost-effectiveness and low latency."
-  },
-  "gemini-2.0-flash-thinking-exp": {
-    "description": "Gemini 2.0 Flash Exp is Google's latest experimental multimodal AI model, featuring next-generation capabilities, exceptional speed, native tool invocation, and multimodal generation."
-  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp is Google's latest experimental multimodal AI model, featuring next-generation capabilities, exceptional speed, native tool invocation, and multimodal generation."
  },
  "gemini-2.0-pro-exp-02-05": {
    "description": "Gemini 2.0 Pro Experimental is Google's latest experimental multimodal AI model, showing a quality improvement compared to previous versions, especially in world knowledge, coding, and long context."
  },
+  "gemini-2.5-pro-exp-03-25": {
+    "description": "Gemini 2.5 Pro Experimental is Google's most advanced thinking model, capable of reasoning about complex problems in code, mathematics, and STEM fields, as well as analyzing large datasets, codebases, and documents using long context."
+  },
  "gemma-7b-it": {
    "description": "Gemma 7B is suitable for medium to small-scale task processing, offering cost-effectiveness."
  },
@@ -1016,6 +1082,9 @@
  "gpt-4o-mini-realtime-preview": {
    "description": "GPT-4o-mini real-time version, supporting real-time audio and text input and output."
  },
+  "gpt-4o-mini-tts": {
+    "description": "GPT-4o mini TTS is a text-to-speech model based on GPT-4o mini, providing high-quality speech generation at a lower cost."
+  },
  "gpt-4o-realtime-preview": {
    "description": "GPT-4o real-time version, supporting real-time audio and text input and output."
  },
@@ -1073,6 +1142,12 @@
  "hunyuan-standard-vision": {
    "description": "The latest multimodal model from Hunyuan, supporting multilingual responses with balanced capabilities in both Chinese and English."
  },
+  "hunyuan-t1-20250321": {
+    "description": "Comprehensively builds model capabilities in both arts and sciences, with strong long-text information capture ability. Supports reasoning and answering various scientific questions, including mathematics, logic, science, and code, of varying difficulty."
+  },
+  "hunyuan-t1-latest": {
+    "description": "The industry's first ultra-large-scale Hybrid-Transformer-Mamba inference model, enhancing reasoning capabilities with exceptional decoding speed, further aligning with human preferences."
+  },
  "hunyuan-translation": {
    "description": "Supports translation between Chinese and 15 other languages including English, Japanese, French, Portuguese, Spanish, Turkish, Russian, Arabic, Korean, Italian, German, Vietnamese, Malay, and Indonesian. It is based on a multi-scenario translation evaluation set with automated COMET scoring, demonstrating overall superior translation capabilities compared to similarly scaled models in the market."
  },
@@ -1082,9 +1157,6 @@
  "hunyuan-turbo": {
    "description": "The preview version of the next-generation Hunyuan large language model, featuring a brand-new mixed expert model (MoE) structure, which offers faster inference efficiency and stronger performance compared to Hunyuan Pro."
  },
-  "hunyuan-turbo-20241120": {
-    "description": "Hunyuan-turbo fixed version as of November 20, 2024, a version that lies between hunyuan-turbo and hunyuan-turbo-latest."
-  },
  "hunyuan-turbo-20241223": {
    "description": "This version optimizes: data instruction scaling, significantly enhancing the model's generalization capabilities; greatly improving mathematical, coding, and logical reasoning abilities; optimizing text understanding and word comprehension capabilities; enhancing the quality of content generation in text creation."
  },
@@ -1094,6 +1166,15 @@
  "hunyuan-turbo-vision": {
    "description": "The next-generation flagship visual language model from Hunyuan, utilizing a new mixed expert model (MoE) structure, with comprehensive improvements in basic recognition, content creation, knowledge Q&A, and analytical reasoning capabilities compared to the previous generation model."
  },
+  "hunyuan-turbos-20250226": {
+    "description": "hunyuan-TurboS pv2.1.2 fixed version with upgraded training tokens; enhanced reasoning capabilities in mathematics, logic, and coding; improved performance in both Chinese and English across text creation, comprehension, knowledge Q&A, and casual conversation."
+  },
+  "hunyuan-turbos-20250313": {
+    "description": "Unifies the style of mathematical problem-solving steps and enhances multi-turn Q&A in mathematics. Optimizes the response style for text creation, removing AI-like characteristics and adding literary flair."
+  },
+  "hunyuan-turbos-latest": {
+    "description": "The latest version of hunyuan-TurboS, the flagship model of Hunyuan, features enhanced reasoning capabilities and improved user experience."
+  },
  "hunyuan-vision": {
    "description": "The latest multimodal model from Hunyuan, supporting image + text input to generate textual content."
  },
@@ -1124,12 +1205,18 @@
  "lite": {
    "description": "Spark Lite is a lightweight large language model with extremely low latency and efficient processing capabilities, completely free and open, supporting real-time online search functionality. Its quick response feature makes it excel in inference applications and model fine-tuning on low-power devices, providing users with excellent cost-effectiveness and intelligent experiences, particularly in knowledge Q&A, content generation, and search scenarios."
  },
+  "llama-2-7b-chat": {
+    "description": "Llama2 is a series of large language models (LLMs) developed and open-sourced by Meta. This series includes generative text models of varying sizes, ranging from 7 billion to 70 billion parameters, which have been pre-trained and fine-tuned. Architecturally, Llama2 is an autoregressive language model that uses an optimized transformer architecture. The fine-tuned versions leverage supervised fine-tuning (SFT) and reinforcement learning with human feedback (RLHF) to align with human preferences for usefulness and safety. Llama2 outperforms the Llama series on multiple academic datasets and provides valuable insights for the design and development of other models."
+  },
  "llama-3.1-70b-versatile": {
    "description": "Llama 3.1 70B provides enhanced AI reasoning capabilities, suitable for complex applications, supporting extensive computational processing while ensuring efficiency and accuracy."
  },
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B is a high-performance model that offers rapid text generation capabilities, making it ideal for applications requiring large-scale efficiency and cost-effectiveness."
  },
+  "llama-3.1-instruct": {
+    "description": "The Llama 3.1 instruction-tuned model is optimized for conversational scenarios, outperforming many existing open-source chat models on common industry benchmarks."
+  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Excellent image reasoning capabilities on high-resolution images, suitable for visual understanding applications."
  },
@@ -1142,12 +1229,18 @@
  "llama-3.2-90b-vision-preview": {
    "description": "Llama 3.2 is designed to handle tasks that combine visual and textual data. It excels in tasks such as image description and visual question answering, bridging the gap between language generation and visual reasoning."
  },
+  "llama-3.2-vision-instruct": {
+    "description": "The Llama 3.2-Vision instruction-tuned model is optimized for visual recognition, image reasoning, image captioning, and answering general questions related to images."
+  },
  "llama-3.3-70b-instruct": {
    "description": "Llama 3.3 is the most advanced multilingual open-source large language model in the Llama series, offering performance comparable to a 405B model at an extremely low cost. Based on the Transformer architecture, it enhances usability and safety through supervised fine-tuning (SFT) and reinforcement learning from human feedback (RLHF). Its instruction-tuned version is optimized for multilingual dialogue and outperforms many open-source and closed chat models on various industry benchmarks. Knowledge cutoff date is December 2023."
  },
  "llama-3.3-70b-versatile": {
    "description": "Meta Llama 3.3 is a multilingual large language model (LLM) with 70 billion parameters (text input/text output), featuring pre-training and instruction-tuning. The instruction-tuned pure text model of Llama 3.3 is optimized for multilingual conversational use cases and outperforms many available open-source and closed chat models on common industry benchmarks."
  },
+  "llama-3.3-instruct": {
+    "description": "The Llama 3.3 instruction-tuned model is optimized for conversational scenarios, outperforming many existing open-source chat models on common industry benchmarks."
+  },
  "llama3-70b-8192": {
    "description": "Meta Llama 3 70B provides unparalleled complexity handling capabilities, tailored for high-demand projects."
  },
@@ -1187,6 +1280,9 @@
  "max-32k": {
    "description": "Spark Max 32K is configured with large context processing capabilities, enhanced contextual understanding, and logical reasoning abilities, supporting text input of 32K tokens, suitable for long document reading, private knowledge Q&A, and other scenarios."
  },
+  "megrez-3b-instruct": {
+    "description": "Megrez-3B-Instruct is a large language model fully trained by Wuwen Xin Qiong. Megrez-3B-Instruct aims to create an ultra-fast, compact, and easy-to-use intelligent solution for edge devices through the concept of hardware-software co-design."
+  },
  "meta-llama-3-70b-instruct": {
    "description": "A powerful 70-billion parameter model excelling in reasoning, coding, and broad language applications."
  },
@@ -1223,9 +1319,6 @@
  "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": {
    "description": "LLaMA 3.2 is designed for tasks involving both visual and textual data. It excels in tasks like image description and visual question answering, bridging the gap between language generation and visual reasoning."
  },
-  "meta-llama/Llama-3.3-70B-Instruct": {
-    "description": "Llama 3.3 is the most advanced multilingual open-source large language model in the Llama series, offering performance comparable to 405B models at a very low cost. Based on the Transformer architecture, it enhances usability and safety through supervised fine-tuning (SFT) and reinforcement learning from human feedback (RLHF). Its instruction-tuned version is optimized for multilingual dialogue and outperforms many open-source and closed chat models on multiple industry benchmarks. Knowledge cutoff date is December 2023."
-  },
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
    "description": "Meta Llama 3.3 is a multilingual large language model (LLM) that is a pre-trained and instruction-tuned generative model within the 70B (text input/text output) framework. The instruction-tuned pure text model is optimized for multilingual dialogue use cases and outperforms many available open-source and closed chat models on common industry benchmarks."
  },
@@ -1253,15 +1346,9 @@
  "meta-llama/Meta-Llama-3.1-70B": {
    "description": "Llama 3.1 is a leading model launched by Meta, supporting up to 405B parameters, applicable in complex conversations, multilingual translation, and data analysis."
  },
-  "meta-llama/Meta-Llama-3.1-70B-Instruct": {
-    "description": "LLaMA 3.1 70B offers efficient conversational support in multiple languages."
-  },
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
    "description": "Llama 3.1 70B model is finely tuned for high-load applications, quantized to FP8 for enhanced computational efficiency and accuracy, ensuring outstanding performance in complex scenarios."
  },
-  "meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "LLaMA 3.1 provides multilingual support and is one of the industry's leading generative models."
-  },
  "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
    "description": "Llama 3.1 8B model utilizes FP8 quantization, supporting up to 131,072 context tokens, making it a standout in open-source models, excelling in complex tasks and outperforming many industry benchmarks."
  },
@@ -1355,12 +1442,18 @@
  "mistral-large": {
    "description": "Mixtral Large is Mistral's flagship model, combining capabilities in code generation, mathematics, and reasoning, supporting a 128k context window."
  },
+  "mistral-large-instruct": {
+    "description": "Mistral-Large-Instruct-2407 is an advanced dense large language model (LLM) with 123 billion parameters, featuring state-of-the-art reasoning, knowledge, and coding capabilities."
+  },
  "mistral-large-latest": {
    "description": "Mistral Large is the flagship model, excelling in multilingual tasks, complex reasoning, and code generation, making it an ideal choice for high-end applications."
  },
  "mistral-nemo": {
    "description": "Mistral Nemo, developed in collaboration with Mistral AI and NVIDIA, is a high-performance 12B model."
  },
+  "mistral-nemo-instruct": {
+    "description": "Mistral-Nemo-Instruct-2407 is the instruction-tuned version of the Mistral-Nemo-Base-2407 large language model (LLM)."
+  },
  "mistral-small": {
    "description": "Mistral Small can be used for any language-based task that requires high efficiency and low latency."
  },
@@ -1577,6 +1670,12 @@
  "qwen2": {
    "description": "Qwen2 is Alibaba's next-generation large-scale language model, supporting diverse application needs with excellent performance."
  },
+  "qwen2-72b-instruct": {
+    "description": "Qwen2 is the new generation of large language model series introduced by the Qwen team. It is based on the Transformer architecture and incorporates technologies such as the SwiGLU activation function, attention QKV bias, group query attention, a mixture of sliding window attention, and full attention. Additionally, the Qwen team has improved the tokenizer to better adapt to multiple natural languages and code."
+  },
+  "qwen2-7b-instruct": {
+    "description": "Qwen2 is the new generation of large language model series introduced by the Qwen team. It is based on the Transformer architecture and incorporates technologies such as the SwiGLU activation function, attention QKV bias, group query attention, a mixture of sliding window attention, and full attention. Additionally, the Qwen team has improved the tokenizer to better adapt to multiple natural languages and code."
+  },
  "qwen2.5": {
    "description": "Qwen2.5 is Alibaba's next-generation large-scale language model, supporting diverse application needs with outstanding performance."
  },
@@ -1604,6 +1703,12 @@
  "qwen2.5-coder-7b-instruct": {
    "description": "The open-source version of the Tongyi Qianwen Coder model."
  },
+  "qwen2.5-coder-instruct": {
+    "description": "Qwen2.5-Coder is the latest code-specific large language model in the Qwen series (formerly known as CodeQwen)."
+  },
+  "qwen2.5-instruct": {
+    "description": "Qwen2.5 is the latest series of Qwen large language models. For Qwen2.5, we have released multiple base language models and instruction-tuned language models with parameter sizes ranging from 0.5 billion to 7.2 billion."
+  },
  "qwen2.5-math-1.5b-instruct": {
    "description": "Qwen-Math model has powerful mathematical problem-solving capabilities."
  },
@@ -1613,12 +1718,21 @@
  "qwen2.5-math-7b-instruct": {
    "description": "The Qwen-Math model possesses strong capabilities for solving mathematical problems."
  },
+  "qwen2.5-omni-7b": {
+    "description": "The Qwen-Omni series models support input of various modalities, including video, audio, images, and text, and output audio and text."
+  },
+  "qwen2.5-vl-32b-instruct": {
+    "description": "The Qwen2.5-VL model series enhances the model's intelligence level, practicality, and applicability, delivering superior performance in scenarios such as natural conversations, content creation, professional knowledge services, and code development. The 32B version employs reinforcement learning techniques to optimize the model, offering more human-preferred output styles, enhanced reasoning capabilities for complex mathematical problems, and fine-grained image understanding and reasoning compared to other models in the Qwen2.5-VL series."
+  },
  "qwen2.5-vl-72b-instruct": {
    "description": "This version enhances instruction following, mathematics, problem-solving, and coding capabilities, improving the ability to recognize various formats and accurately locate visual elements. It supports understanding long video files (up to 10 minutes) and pinpointing events in seconds, comprehending the sequence and speed of time, and based on parsing and locating capabilities, it supports controlling OS or Mobile agents. It has strong key information extraction and JSON output capabilities, and this version is the most powerful in the series at 72B."
  },
  "qwen2.5-vl-7b-instruct": {
    "description": "This version enhances instruction following, mathematics, problem-solving, and coding capabilities, improving the ability to recognize various formats and accurately locate visual elements. It supports understanding long video files (up to 10 minutes) and pinpointing events in seconds, comprehending the sequence and speed of time, and based on parsing and locating capabilities, it supports controlling OS or Mobile agents. It has strong key information extraction and JSON output capabilities, and this version is the most powerful in the series at 72B."
  },
+  "qwen2.5-vl-instruct": {
+    "description": "Qwen2.5-VL is the latest version of the visual language model in the Qwen model family."
+  },
  "qwen2.5:0.5b": {
    "description": "Qwen2.5 is Alibaba's next-generation large-scale language model, supporting diverse application needs with outstanding performance."
  },
@@ -1754,6 +1868,9 @@
  "wizardlm2:8x22b": {
    "description": "WizardLM 2 is a language model provided by Microsoft AI, excelling in complex dialogues, multilingual capabilities, reasoning, and intelligent assistant applications."
  },
+  "yi-1.5-34b-chat": {
+    "description": "Yi-1.5 is an upgraded version of Yi. It continues pre-training on Yi using a high-quality corpus of 500B tokens and is fine-tuned on 3M diverse samples."
+  },
  "yi-large": {
    "description": "A new trillion-parameter model, providing super strong question-answering and text generation capabilities."
  },
@@ -23,6 +23,9 @@
  "cloudflare": {
    "description": "Run serverless GPU-powered machine learning models on Cloudflare's global network."
  },
+  "cohere": {
+    "description": "Cohere brings you cutting-edge multilingual models, advanced retrieval capabilities, and an AI workspace tailored for modern enterprises—all integrated into a secure platform."
+  },
  "deepseek": {
    "description": "DeepSeek is a company focused on AI technology research and application, with its latest model DeepSeek-V2.5 integrating general dialogue and code processing capabilities, achieving significant improvements in human preference alignment, writing tasks, and instruction following."
  },
@@ -53,6 +56,9 @@
  "hunyuan": {
    "description": "A large language model developed by Tencent, equipped with powerful Chinese creative capabilities, logical reasoning abilities in complex contexts, and reliable task execution skills."
  },
+  "infiniai": {
+    "description": "Provides high-performance, easy-to-use, and secure large model services for application developers, covering the entire process from large model development to service deployment."
+  },
  "internlm": {
    "description": "An open-source organization dedicated to the research and development of large model toolchains. It provides an efficient and user-friendly open-source platform for all AI developers, making cutting-edge large models and algorithm technologies easily accessible."
  },
@@ -98,6 +104,9 @@
  "sambanova": {
    "description": "SambaNova Cloud allows developers to easily utilize the best open-source models and enjoy the fastest inference speeds."
  },
+  "search1api": {
+    "description": "Search1API provides access to the DeepSeek series of models that can connect to the internet as needed, including standard and fast versions, supporting a variety of model sizes."
+  },
  "sensenova": {
    "description": "SenseNova, backed by SenseTime's robust infrastructure, offers efficient and user-friendly full-stack large model services."
  },
@@ -137,6 +146,9 @@
  "xai": {
    "description": "xAI is a company dedicated to building artificial intelligence to accelerate human scientific discovery. Our mission is to advance our collective understanding of the universe."
  },
+  "xinference": {
+    "description": "Xorbits Inference (Xinference) is an open-source platform designed to simplify the deployment and integration of diverse AI models. With Xinference, you can leverage any open-source LLM, embedding model, or multimodal model to perform inference in cloud or on-premises environments, enabling the creation of powerful AI applications."
+  },
  "zeroone": {
    "description": "01.AI focuses on AI 2.0 era technologies, vigorously promoting the innovation and application of 'human + artificial intelligence', using powerful models and advanced AI technologies to enhance human productivity and achieve technological empowerment."
  },
@@ -42,6 +42,17 @@
    "sessionWithName": "Session Settings · {{name}}",
    "title": "Settings"
  },
+  "hotkey": {
+    "conflicts": "Conflicts with existing hotkeys",
+    "group": {
+      "conversation": "Conversation",
+      "essential": "Essential"
+    },
+    "invalidCombination": "The hotkey must include at least one modifier key (Ctrl, Alt, Shift) and one regular key",
+    "record": "Press a key to record the hotkey",
+    "reset": "Reset to default hotkeys",
+    "title": "Hotkeys"
+  },
  "llm": {
    "aesGcm": "Your keys and proxy address will be encrypted using the <1>AES-GCM</1> encryption algorithm",
    "apiKey": {
@@ -335,6 +346,33 @@
    },
    "title": "Theme Settings"
  },
+  "storage": {
+    "actions": {
+      "export": {
+        "button": "Export",
+        "exportType": {
+          "agent": "Export Assistant Settings",
+          "agentWithMessage": "Export Assistant and Messages",
+          "all": "Export Global Settings and All Assistant Data",
+          "allAgent": "Export All Assistant Settings",
+          "allAgentWithMessage": "Export All Assistants and Messages",
+          "globalSetting": "Export Global Settings"
+        },
+        "title": "Export Data"
+      },
+      "import": {
+        "button": "Import",
+        "title": "Import Data"
+      },
+      "title": "Advanced Operations"
+    },
+    "desc": "Current storage usage in the browser",
+    "embeddings": {
+      "used": "Vector Storage"
+    },
+    "title": "Data Storage",
+    "used": "Storage Usage"
+  },
  "submitAgentModal": {
    "button": "Submit Assistant",
    "identifier": "Assistant Identifier",
@@ -425,8 +463,10 @@
    "agent": "Default Assistant",
    "common": "Common Settings",
    "experiment": "Experiment",
+    "hotkey": "Hotkeys",
    "llm": "Language Model",
    "provider": "AI Service Provider",
+    "storage": "Data Storage",
    "sync": "Cloud Sync",
    "system-agent": "System Assistant",
    "tts": "Text-to-Speech"
@@ -32,6 +32,7 @@
    "title": "Topic List"
  },
  "searchPlaceholder": "Search Topics...",
+  "searchResultEmpty": "No search results found.",
  "temp": "Temporary",
  "title": "Topic"
 }
@@ -64,6 +64,9 @@
    "stop": "Detener",
    "warp": "Salto de línea"
  },
+  "intentUnderstanding": {
+    "title": "Entendiendo y analizando su intención..."
+  },
  "knowledgeBase": {
    "all": "Todo el contenido",
    "allFiles": "Todos los archivos",
@@ -144,7 +147,6 @@
        "desc": "Determina inteligentemente si se necesita buscar según el contenido de la conversación",
        "title": "Conexión inteligente"
      },
-      "disable": "El modelo actual no admite llamadas a funciones, por lo que no se puede utilizar la función de conexión inteligente",
      "off": {
        "desc": "Utiliza solo el conocimiento básico del modelo, sin realizar búsquedas en línea",
        "title": "Desactivar conexión"
@@ -155,6 +157,10 @@
      },
      "useModelBuiltin": "Utilizar el motor de búsqueda integrado del modelo"
    },
+    "searchModel": {
+      "desc": "El modelo actual no admite llamadas a funciones, por lo que se necesita combinarlo con un modelo que admita llamadas a funciones para realizar búsquedas en línea",
+      "title": "Modelo de búsqueda auxiliar"
+    },
    "title": "Búsqueda en línea"
  },
  "searchAgentPlaceholder": "Asistente de búsqueda...",
@@ -41,7 +41,10 @@
    "error": {
      "desc": "Lo sentimos, ha ocurrido una excepción en el proceso de inicialización de la base de datos Pglite. Por favor, haga clic en el botón para intentar de nuevo. Si después de varios intentos sigue ocurriendo el mismo error, por favor <1>envíe un problema</1>, y lo resolveremos lo antes posible.",
      "detail": "Razón del error: [{{type}}] {{message}}. Detalles a continuación:",
+      "detailTitle": "Razón del error",
+      "report": "Informar problema",
      "retry": "Reintentar",
+      "selfSolve": "Solución autónoma",
      "title": "Falló la inicialización de la base de datos"
    },
    "initing": {
@@ -80,6 +83,54 @@
      "button": "Usar ahora",
      "desc": "Listo para usar",
      "title": "La base de datos PGlite está lista"
+    },
+    "solve": {
+      "backup": {
+        "backup": "Copia de seguridad",
+        "backupSuccess": "Copia de seguridad exitosa",
+        "desc": "Exportar datos clave de la base de datos actual",
+        "export": "Exportar todos los datos",
+        "exportDesc": "Los datos exportados se guardarán en formato JSON, que se puede utilizar para recuperación o análisis posterior.",
+        "reset": {
+          "alert": "Advertencia",
+          "alertDesc": "Las siguientes operaciones pueden causar pérdida de datos. Asegúrese de haber respaldado datos importantes antes de continuar.",
+          "button": "Restablecer completamente la base de datos (eliminar todos los datos)",
+          "confirm": {
+            "desc": "Esta operación eliminará todos los datos y no se puede deshacer, ¿confirma que desea continuar?",
+            "title": "Confirmar restablecimiento de la base de datos"
+          },
+          "desc": "Restablecer la base de datos en caso de migración no recuperable",
+          "title": "Restablecimiento de la base de datos"
+        },
+        "restore": "Restaurar",
+        "restoreSuccess": "Restauración exitosa",
+        "title": "Copia de seguridad de datos"
+      },
+      "diagnosis": {
+        "createdAt": "Fecha de creación",
+        "migratedAt": "Fecha de finalización de la migración",
+        "sql": "SQL de migración",
+        "title": "Estado de la migración"
+      },
+      "repair": {
+        "desc": "Gestionar manualmente el estado de la migración",
+        "runSQL": "Ejecutar personalizado",
+        "sql": {
+          "clear": "Limpiar",
+          "desc": "Ejecutar sentencias SQL personalizadas para reparar problemas de la base de datos",
+          "markFinished": "Marcar como completado",
+          "placeholder": "Introducir sentencia SQL...",
+          "result": "Resultado de la ejecución",
+          "run": "Ejecutar",
+          "title": "Ejecutor de SQL"
+        },
+        "title": "Control de migración"
+      },
+      "tabs": {
+        "backup": "Copia de seguridad y restauración",
+        "diagnosis": "Diagnóstico",
+        "repair": "Reparar"
+      }
    }
  },
  "close": "Cerrar",
@@ -132,7 +183,7 @@
  },
  "fullscreen": "Pantalla completa",
  "historyRange": "Rango de historial",
-  "import": "Importar configuración",
+  "importData": "Importar datos",
  "importModal": {
    "error": {
      "desc": "Lo sentimos mucho, se produjo un error durante el proceso de importación de datos. Inténtalo de nuevo o <1>envía un informe</1>, y te ayudaremos a solucionar el problema lo antes posible.",
@@ -154,7 +205,8 @@
      "sessions": "Asistentes",
      "skips": "Saltos de duplicados",
      "topics": "Temas",
-      "type": "Tipo de datos"
+      "type": "Tipo de datos",
+      "update": "Registro actualizado"
    },
    "title": "Importar datos",
    "uploading": {
@@ -163,6 +215,16 @@
      "speed": "Velocidad de carga"
    }
  },
+  "importPreview": {
+    "confirmImport": "Confirmar importación",
+    "tables": {
+      "count": "Número de registros",
+      "name": "Nombre de la tabla"
+    },
+    "title": "Vista previa de la importación de datos",
+    "totalRecords": "Se importarán un total de {{count}} registros",
+    "totalTables": "{{count}} tablas"
+  },
  "information": "Comunidad e Información",
  "installPWA": "Instalar la aplicación del navegador",
  "lang": {
@@ -76,6 +76,7 @@
      "custom": "Modelo personalizado: admite llamadas de función y reconocimiento visual. Verifique la disponibilidad de estas capacidades según sea necesario.",
      "file": "Este modelo admite la carga y reconocimiento de archivos.",
      "functionCall": "Este modelo admite llamadas de función.",
+      "imageOutput": "Este modelo admite la generación de imágenes",
      "reasoning": "Este modelo admite un pensamiento profundo",
      "search": "Este modelo admite búsqueda en línea",
      "tokens": "Este modelo admite un máximo de {{tokens}} tokens por sesión.",
@@ -85,6 +86,8 @@
  },
  "ModelSwitchPanel": {
    "emptyModel": "No hay modelos habilitados. Vaya a la configuración para habilitarlos.",
+    "emptyProvider": "No hay proveedores habilitados, por favor ve a la configuración para activarlos",
+    "goToSettings": "Ir a la configuración",
    "provider": "Proveedor"
  },
  "OllamaSetupGuide": {
@@ -16,6 +16,16 @@
    "detail": "Detalles del error",
    "title": "Solicitud fallida"
  },
+  "import": {
+    "importConfigFile": {
+      "description": "Razón del error: {{reason}}",
+      "title": "Importación fallida"
+    },
+    "incompatible": {
+      "description": "Este archivo fue exportado desde una versión más alta, por favor intente actualizar a la última versión y luego vuelva a importar",
+      "title": "La aplicación actual no admite la importación de este archivo"
+    }
+  },
  "loginRequired": {
    "desc": "Serás redirigido automáticamente a la página de inicio de sesión",
    "title": "Por favor, inicie sesión para utilizar esta función"
@@ -69,6 +79,7 @@
    "524": "Lo sentimos, el servidor ha agotado el tiempo de espera mientras esperaba una respuesta, puede ser debido a que la respuesta es demasiado lenta, por favor inténtelo de nuevo más tarde",
    "AgentRuntimeError": "Se produjo un error en la ejecución del tiempo de ejecución del modelo de lenguaje Lobe, por favor, verifica la siguiente información o inténtalo de nuevo",
    "ConnectionCheckFailed": "La respuesta de la solicitud está vacía, por favor verifica que la dirección del proxy de la API no termine con `/v1`",
+    "CreateMessageError": "Lo sentimos, el mensaje no se pudo enviar correctamente. Por favor, copia el contenido y vuelve a enviarlo. Después de actualizar la página, este mensaje no se conservará.",
    "ExceededContextWindow": "El contenido de la solicitud actual excede la longitud que el modelo puede procesar. Por favor, reduzca la cantidad de contenido y vuelva a intentarlo.",
    "FreePlanLimit": "Actualmente eres un usuario gratuito y no puedes utilizar esta función. Por favor, actualiza a un plan de pago para seguir utilizando.",
    "InsufficientQuota": "Lo sentimos, la cuota de esta clave ha alcanzado su límite. Por favor, verifique si el saldo de su cuenta es suficiente o aumente la cuota de la clave y vuelva a intentarlo.",
@@ -0,0 +1,46 @@
+{
+  "addUserMessage": {
+    "desc": "Añadir el contenido actual como un mensaje de usuario, pero sin activar la generación",
+    "title": "Añadir un mensaje de usuario"
+  },
+  "editMessage": {
+    "desc": "Entrar en modo de edición manteniendo presionada la tecla Alt y haciendo doble clic en el mensaje",
+    "title": "Editar mensaje"
+  },
+  "openChatSettings": {
+    "desc": "Ver y modificar la configuración de la conversación actual",
+    "title": "Abrir configuración de la conversación"
+  },
+  "openHotkeyHelper": {
+    "desc": "Ver las instrucciones de uso de todos los atajos de teclado",
+    "title": "Abrir ayuda de atajos de teclado"
+  },
+  "regenerateMessage": {
+    "desc": "Regenerar el último mensaje",
+    "title": "Regenerar mensaje"
+  },
+  "saveTopic": {
+    "desc": "Guardar el tema actual y abrir un nuevo tema",
+    "title": "Iniciar un nuevo tema"
+  },
+  "search": {
+    "desc": "Invocar el cuadro de búsqueda principal de la página actual",
+    "title": "Buscar"
+  },
+  "switchAgent": {
+    "desc": "Cambiar el asistente fijado en la barra lateral manteniendo presionada la tecla Ctrl y pulsando un número del 0 al 9",
+    "title": "Cambio rápido de asistente"
+  },
+  "toggleLeftPanel": {
+    "desc": "Mostrar u ocultar el panel de asistente a la izquierda",
+    "title": "Mostrar/Ocultar panel de asistente"
+  },
+  "toggleRightPanel": {
+    "desc": "Mostrar u ocultar el panel de temas a la derecha",
+    "title": "Mostrar/Ocultar panel de temas"
+  },
+  "toggleZenMode": {
+    "desc": "En modo de enfoque, solo se muestra la conversación actual, ocultando otras interfaces",
+    "title": "Alternar modo de enfoque"
+  }
+}
@@ -1,13 +1,4 @@
 {
-  "01-ai/Yi-1.5-34B-Chat-16K": {
-    "description": "Yi-1.5 34B, con un rico conjunto de muestras de entrenamiento, ofrece un rendimiento superior en aplicaciones industriales."
-  },
-  "01-ai/Yi-1.5-6B-Chat": {
-    "description": "Yi-1.5-6B-Chat es una variante de la serie Yi-1.5, que pertenece a los modelos de chat de código abierto. Yi-1.5 es una versión mejorada de Yi, que ha sido preentrenada de manera continua en 500B de corpus de alta calidad y ajustada en más de 3M de muestras de ajuste diversificadas. En comparación con Yi, Yi-1.5 muestra un rendimiento superior en codificación, matemáticas, razonamiento y capacidad de seguimiento de instrucciones, manteniendo al mismo tiempo una excelente comprensión del lenguaje, razonamiento de sentido común y comprensión de lectura. Este modelo tiene versiones con longitudes de contexto de 4K, 16K y 32K, con un total de preentrenamiento de 3.6T de tokens."
-  },
-  "01-ai/Yi-1.5-9B-Chat-16K": {
-    "description": "Yi-1.5 9B soporta 16K Tokens, proporcionando una capacidad de generación de lenguaje eficiente y fluida."
-  },
  "01-ai/yi-1.5-34b-chat": {
    "description": "Cero Uno, el último modelo de ajuste fino de código abierto, cuenta con 34 mil millones de parámetros, con ajuste fino que admite múltiples escenarios de conversación y datos de entrenamiento de alta calidad, alineados con las preferencias humanas."
  },
@@ -149,12 +140,6 @@
  "Llama-3.2-90B-Vision-Instruct\t": {
    "description": "Capacidad avanzada de razonamiento de imágenes para aplicaciones de agentes de comprensión visual."
  },
-  "LoRA/Qwen/Qwen2.5-72B-Instruct": {
-    "description": "Qwen2.5-72B-Instruct es uno de los últimos modelos de lenguaje a gran escala lanzados por Alibaba Cloud. Este modelo de 72B ha mejorado significativamente en áreas como codificación y matemáticas. También ofrece soporte multilingüe, abarcando más de 29 idiomas, incluidos chino e inglés. El modelo ha mostrado mejoras significativas en el seguimiento de instrucciones, comprensión de datos estructurados y generación de salidas estructuradas (especialmente JSON)."
-  },
-  "LoRA/Qwen/Qwen2.5-7B-Instruct": {
-    "description": "Qwen2.5-7B-Instruct es uno de los últimos modelos de lenguaje a gran escala lanzados por Alibaba Cloud. Este modelo de 7B ha mejorado significativamente en áreas como codificación y matemáticas. También ofrece soporte multilingüe, abarcando más de 29 idiomas, incluidos chino e inglés. El modelo ha mostrado mejoras significativas en el seguimiento de instrucciones, comprensión de datos estructurados y generación de salidas estructuradas (especialmente JSON)."
-  },
  "Meta-Llama-3.1-405B-Instruct": {
    "description": "Modelo de texto ajustado por instrucciones de Llama 3.1, optimizado para casos de uso de diálogos multilingües, que se destaca en muchos modelos de chat de código abierto y cerrados en benchmarks de la industria comunes."
  },
@@ -179,9 +164,6 @@
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": {
    "description": "Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B) es un modelo de instrucciones de alta precisión, adecuado para cálculos complejos."
  },
-  "OpenGVLab/InternVL2-26B": {
-    "description": "InternVL2 ha demostrado un rendimiento sobresaliente en diversas tareas de lenguaje visual, incluidas la comprensión de documentos y gráficos, comprensión de texto en escenas, OCR, resolución de problemas científicos y matemáticos."
-  },
  "Phi-3-medium-128k-instruct": {
    "description": "El mismo modelo Phi-3-medium, pero con un tamaño de contexto más grande para RAG o indicaciones de pocos disparos."
  },
@@ -206,9 +188,6 @@
  "Phi-3.5-vision-instrust": {
    "description": "Versión actualizada del modelo Phi-3-vision."
  },
-  "Pro/OpenGVLab/InternVL2-8B": {
-    "description": "InternVL2 ha demostrado un rendimiento sobresaliente en diversas tareas de lenguaje visual, incluidas la comprensión de documentos y gráficos, comprensión de texto en escenas, OCR, resolución de problemas científicos y matemáticos."
-  },
  "Pro/Qwen/Qwen2-1.5B-Instruct": {
    "description": "Qwen2-1.5B-Instruct es un modelo de lenguaje a gran escala de ajuste fino por instrucciones dentro de la serie Qwen2, con un tamaño de parámetros de 1.5B. Este modelo se basa en la arquitectura Transformer, utilizando funciones de activación SwiGLU, sesgos de atención QKV y atención de consulta agrupada, entre otras técnicas. Ha destacado en múltiples pruebas de referencia en comprensión del lenguaje, generación, capacidad multilingüe, codificación, matemáticas y razonamiento, superando a la mayoría de los modelos de código abierto. En comparación con Qwen1.5-1.8B-Chat, Qwen2-1.5B-Instruct ha mostrado mejoras significativas en pruebas como MMLU, HumanEval, GSM8K, C-Eval e IFEval, a pesar de tener un número de parámetros ligeramente menor."
  },
@@ -224,20 +203,26 @@
  "Pro/Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct es la última versión de la serie de modelos de lenguaje a gran escala específicos para código lanzada por Alibaba Cloud. Este modelo, basado en Qwen2.5, ha mejorado significativamente la generación, razonamiento y reparación de código a través de un entrenamiento con 55 billones de tokens. No solo ha mejorado la capacidad de codificación, sino que también ha mantenido ventajas en habilidades matemáticas y generales. El modelo proporciona una base más completa para aplicaciones prácticas como agentes de código."
  },
+  "Pro/Qwen/Qwen2.5-VL-7B-Instruct": {
+    "description": "Qwen2.5-VL es el nuevo miembro de la serie Qwen, con potentes capacidades de comprensión visual. Puede analizar texto, gráficos y diseños en imágenes, comprender videos largos y capturar eventos. Es capaz de razonar, manipular herramientas, admitir el posicionamiento de objetos en múltiples formatos y generar salidas estructuradas. Optimiza la resolución dinámica y la tasa de cuadros para la comprensión de videos, además de mejorar la eficiencia del codificador visual."
+  },
  "Pro/THUDM/glm-4-9b-chat": {
    "description": "GLM-4-9B-Chat es la versión de código abierto de la serie de modelos preentrenados GLM-4 lanzada por Zhipu AI. Este modelo destaca en semántica, matemáticas, razonamiento, código y conocimiento. Además de soportar diálogos de múltiples turnos, GLM-4-9B-Chat también cuenta con funciones avanzadas como navegación web, ejecución de código, llamadas a herramientas personalizadas (Function Call) y razonamiento de textos largos. El modelo admite 26 idiomas, incluidos chino, inglés, japonés, coreano y alemán. En múltiples pruebas de referencia, GLM-4-9B-Chat ha demostrado un rendimiento excepcional, como AlignBench-v2, MT-Bench, MMLU y C-Eval. Este modelo admite una longitud de contexto máxima de 128K, adecuado para investigación académica y aplicaciones comerciales."
  },
  "Pro/deepseek-ai/DeepSeek-R1": {
    "description": "DeepSeek-R1 es un modelo de inferencia impulsado por aprendizaje por refuerzo (RL) que aborda problemas de repetitividad y legibilidad en el modelo. Antes del RL, DeepSeek-R1 introdujo datos de arranque en frío, optimizando aún más el rendimiento de inferencia. Se desempeña de manera comparable a OpenAI-o1 en tareas matemáticas, de código e inferencia, y mejora el rendimiento general a través de métodos de entrenamiento cuidadosamente diseñados."
  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
+    "description": "DeepSeek-R1-Distill-Qwen-1.5B es un modelo obtenido mediante destilación de conocimiento basado en Qwen2.5-Math-1.5B. Este modelo fue ajustado utilizando 800,000 muestras seleccionadas generadas por DeepSeek-R1, demostrando un rendimiento notable en múltiples benchmarks. Como modelo ligero, alcanzó una precisión del 83.9% en MATH-500, una tasa de aprobación del 28.9% en AIME 2024 y una puntuación de 954 en CodeForces, mostrando capacidades de razonamiento que superan su escala de parámetros."
+  },
+  "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": {
+    "description": "DeepSeek-R1-Distill-Qwen-7B es un modelo obtenido mediante destilación de conocimiento basado en Qwen2.5-Math-7B. Este modelo se ha ajustado utilizando 800.000 muestras seleccionadas generadas por DeepSeek-R1, demostrando una excelente capacidad de razonamiento. Ha mostrado un rendimiento sobresaliente en múltiples pruebas de referencia, alcanzando un 92,8% de precisión en MATH-500, un 55,5% de tasa de aprobación en AIME 2024 y una puntuación de 1189 en CodeForces, lo que demuestra una fuerte capacidad matemática y de programación para un modelo de escala 7B."
+  },
  "Pro/deepseek-ai/DeepSeek-V3": {
    "description": "DeepSeek-V3 es un modelo de lenguaje de expertos mixtos (MoE) con 671 mil millones de parámetros, que utiliza atención potencial de múltiples cabezas (MLA) y la arquitectura DeepSeekMoE, combinando estrategias de balanceo de carga sin pérdidas auxiliares para optimizar la eficiencia de inferencia y entrenamiento. Preentrenado en 14.8 billones de tokens de alta calidad, y ajustado mediante supervisión y aprendizaje por refuerzo, DeepSeek-V3 supera a otros modelos de código abierto y se acerca a los modelos cerrados líderes."
  },
-  "Pro/google/gemma-2-9b-it": {
-    "description": "Gemma es una de las series de modelos abiertos más avanzados y ligeros desarrollados por Google. Es un modelo de lenguaje a gran escala solo de decodificación, que admite inglés y proporciona pesos abiertos, variantes preentrenadas y variantes de ajuste fino por instrucciones. El modelo Gemma es adecuado para diversas tareas de generación de texto, incluyendo preguntas y respuestas, resúmenes y razonamiento. Este modelo de 9B se ha entrenado con 80 billones de tokens. Su tamaño relativamente pequeño permite su implementación en entornos con recursos limitados, como computadoras portátiles, de escritorio o su propia infraestructura en la nube, lo que permite a más personas acceder a modelos de IA de vanguardia y fomentar la innovación."
-  },
-  "Pro/meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "Meta Llama 3.1 es parte de la familia de modelos de lenguaje a gran escala multilingües desarrollados por Meta, que incluye variantes preentrenadas y de ajuste fino por instrucciones con tamaños de parámetros de 8B, 70B y 405B. Este modelo de 8B ha sido optimizado para escenarios de diálogo multilingüe y ha destacado en múltiples pruebas de referencia de la industria. El entrenamiento del modelo utilizó más de 150 billones de tokens de datos públicos y empleó técnicas como ajuste fino supervisado y aprendizaje por refuerzo con retroalimentación humana para mejorar la utilidad y seguridad del modelo. Llama 3.1 admite generación de texto y generación de código, con una fecha límite de conocimiento hasta diciembre de 2023."
+  "Pro/deepseek-ai/DeepSeek-V3-1226": {
+    "description": "DeepSeek-V3 es un modelo de lenguaje de expertos mixtos (MoE) con 671 mil millones de parámetros, que utiliza atención latente de múltiples cabezas (MLA) y la arquitectura DeepSeekMoE, combinando una estrategia de balanceo de carga sin pérdidas auxiliares para optimizar la eficiencia de inferencia y entrenamiento. Preentrenado en 14.8 billones de tokens de alta calidad y ajustado mediante supervisión y aprendizaje por refuerzo, DeepSeek-V3 supera en rendimiento a otros modelos de código abierto, acercándose a los modelos cerrados líderes."
  },
  "QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview es un modelo de procesamiento de lenguaje natural innovador, capaz de manejar de manera eficiente tareas complejas de generación de diálogos y comprensión del contexto."
@@ -290,6 +275,12 @@
  "Qwen/Qwen2.5-Coder-7B-Instruct": {
    "description": "Qwen2.5-Coder-7B-Instruct es la última versión de la serie de modelos de lenguaje a gran escala específicos para código lanzada por Alibaba Cloud. Este modelo, basado en Qwen2.5, ha mejorado significativamente la generación, razonamiento y reparación de código a través de un entrenamiento con 55 billones de tokens. No solo ha mejorado la capacidad de codificación, sino que también ha mantenido ventajas en habilidades matemáticas y generales. El modelo proporciona una base más completa para aplicaciones prácticas como agentes de código."
  },
+  "Qwen/Qwen2.5-VL-32B-Instruct": {
+    "description": "Qwen2.5-VL-32B-Instruct es un modelo multimodal avanzado desarrollado por el equipo Tongyi Qianwen, que forma parte de la serie Qwen2.5-VL. Este modelo no solo domina el reconocimiento de objetos comunes, sino que también puede analizar texto, gráficos, iconos, diagramas y diseños en imágenes. Funciona como un agente visual inteligente capaz de razonar y manipular herramientas dinámicamente, con habilidades para operar computadoras y dispositivos móviles. Además, el modelo puede localizar con precisión objetos en imágenes y generar salidas estructuradas para documentos como facturas y tablas. En comparación con su predecesor Qwen2-VL, esta versión ha mejorado significativamente sus capacidades matemáticas y de resolución de problemas mediante aprendizaje por refuerzo, y su estilo de respuesta se ha optimizado para adaptarse mejor a las preferencias humanas."
+  },
+  "Qwen/Qwen2.5-VL-72B-Instruct": {
+    "description": "Qwen2.5-VL es el modelo de lenguaje visual de la serie Qwen2.5. Este modelo presenta mejoras significativas en múltiples aspectos: posee una mayor capacidad de comprensión visual, pudiendo reconocer objetos comunes, analizar texto, gráficos y diseños; como agente visual puede razonar y guiar dinámicamente el uso de herramientas; soporta la comprensión de videos largos de más de 1 hora capturando eventos clave; es capaz de localizar objetos en imágenes con precisión generando cuadros delimitadores o puntos; y admite la generación de salidas estructuradas, especialmente útil para datos escaneados como facturas o tablas."
+  },
  "Qwen2-72B-Instruct": {
    "description": "Qwen2 es la última serie del modelo Qwen, que admite un contexto de 128k. En comparación con los modelos de código abierto más óptimos actuales, Qwen2-72B supera significativamente a los modelos líderes actuales en comprensión del lenguaje natural, conocimiento, código, matemáticas y capacidades multilingües."
  },
@@ -374,9 +365,6 @@
  "TeleAI/TeleChat2": {
    "description": "El modelo grande TeleChat2 ha sido desarrollado de manera independiente por China Telecom desde cero, siendo un modelo semántico generativo que admite funciones como preguntas y respuestas enciclopédicas, generación de código y generación de textos largos, proporcionando servicios de consulta conversacional a los usuarios, permitiendo interacciones de diálogo, respondiendo preguntas y asistiendo en la creación, ayudando a los usuarios a obtener información, conocimiento e inspiración de manera eficiente y conveniente. El modelo ha mostrado un rendimiento destacado en problemas de alucinación, generación de textos largos y comprensión lógica."
  },
-  "TeleAI/TeleMM": {
-    "description": "El modelo multimodal TeleMM ha sido desarrollado de manera independiente por China Telecom, siendo un modelo de comprensión multimodal que puede manejar entradas de múltiples modalidades como texto e imágenes, apoyando funciones como comprensión de imágenes y análisis de gráficos, proporcionando servicios de comprensión cruzada para los usuarios. El modelo puede interactuar con los usuarios de manera multimodal, entendiendo con precisión el contenido de entrada, respondiendo preguntas, asistiendo en la creación y proporcionando de manera eficiente información y apoyo inspirador multimodal. Ha mostrado un rendimiento excepcional en tareas multimodales como percepción de alta resolución y razonamiento lógico."
-  },
  "Vendor-A/Qwen/Qwen2.5-72B-Instruct": {
    "description": "Qwen2.5-72B-Instruct es uno de los últimos modelos de lenguaje a gran escala lanzados por Alibaba Cloud. Este modelo de 72B ha mejorado significativamente en áreas como codificación y matemáticas. También ofrece soporte multilingüe, abarcando más de 29 idiomas, incluidos chino e inglés. El modelo ha mostrado mejoras significativas en el seguimiento de instrucciones, comprensión de datos estructurados y generación de salidas estructuradas (especialmente JSON)."
  },
@@ -506,6 +494,9 @@
  "anthropic/claude-3.5-sonnet": {
    "description": "Claude 3.5 Sonnet ofrece capacidades que superan a Opus y una velocidad más rápida que Sonnet, manteniendo el mismo precio que Sonnet. Sonnet es especialmente hábil en programación, ciencia de datos, procesamiento visual y tareas de agente."
  },
+  "anthropic/claude-3.7-sonnet": {
+    "description": "Claude 3.7 Sonnet es el modelo más inteligente de Anthropic hasta la fecha y el primer modelo de razonamiento híbrido en el mercado. Claude 3.7 Sonnet puede generar respuestas casi instantáneas o un pensamiento prolongado y gradual, permitiendo a los usuarios observar claramente estos procesos. Sonnet es especialmente hábil en programación, ciencia de datos, procesamiento visual y tareas de agente."
+  },
  "aya": {
    "description": "Aya 23 es un modelo multilingüe lanzado por Cohere, que admite 23 idiomas, facilitando aplicaciones de lenguaje diversas."
  },
@@ -515,9 +506,27 @@
  "baichuan/baichuan2-13b-chat": {
    "description": "Baichuan-13B es un modelo de lenguaje de gran escala de código abierto y comercializable desarrollado por Baichuan Intelligence, que cuenta con 13 mil millones de parámetros y ha logrado los mejores resultados en benchmarks autorizados en chino e inglés."
  },
+  "c4ai-aya-expanse-32b": {
+    "description": "Aya Expanse es un modelo multilingüe de alto rendimiento de 32B, diseñado para desafiar el rendimiento de los modelos monolingües a través de innovaciones en ajuste por instrucciones, arbitraje de datos, entrenamiento de preferencias y fusión de modelos. Soporta 23 idiomas."
+  },
+  "c4ai-aya-expanse-8b": {
+    "description": "Aya Expanse es un modelo multilingüe de alto rendimiento de 8B, diseñado para desafiar el rendimiento de los modelos monolingües a través de innovaciones en ajuste por instrucciones, arbitraje de datos, entrenamiento de preferencias y fusión de modelos. Soporta 23 idiomas."
+  },
+  "c4ai-aya-vision-32b": {
+    "description": "Aya Vision es un modelo multimodal de última generación, que destaca en múltiples benchmarks clave de capacidades lingüísticas, textuales y visuales. Soporta 23 idiomas. Esta versión de 32B se centra en el rendimiento multilingüe de vanguardia."
+  },
+  "c4ai-aya-vision-8b": {
+    "description": "Aya Vision es un modelo multimodal de última generación, que destaca en múltiples benchmarks clave de capacidades lingüísticas, textuales y visuales. Esta versión de 8B se centra en baja latencia y rendimiento óptimo."
+  },
  "charglm-3": {
    "description": "CharGLM-3 está diseñado para juegos de rol y acompañamiento emocional, soportando memoria de múltiples rondas y diálogos personalizados, con aplicaciones amplias."
  },
+  "chatglm3": {
+    "description": "ChatGLM3 es un modelo de código cerrado desarrollado por Zhipu AI y el Laboratorio KEG de Tsinghua. Ha sido preentrenado con una gran cantidad de identificadores en chino e inglés y ajustado a las preferencias humanas. En comparación con el modelo de primera generación, ha logrado mejoras del 16%, 36% y 280% en MMLU, C-Eval y GSM8K, respectivamente, y ha alcanzado el primer lugar en el ranking de tareas en chino C-Eval. Es adecuado para escenarios que requieren un alto nivel de conocimiento, capacidad de razonamiento y creatividad, como la redacción de anuncios, la escritura de novelas, la redacción de contenido de conocimiento y la generación de código."
+  },
+  "chatglm3-6b-base": {
+    "description": "ChatGLM3-6b-base es el modelo base de la última generación de la serie ChatGLM, desarrollado por Zhipu, con una escala de 6.000 millones de parámetros y de código abierto."
+  },
  "chatgpt-4o-latest": {
    "description": "ChatGPT-4o es un modelo dinámico que se actualiza en tiempo real para mantener la versión más actual. Combina una poderosa comprensión y generación de lenguaje, adecuado para aplicaciones a gran escala, incluyendo servicio al cliente, educación y soporte técnico."
  },
@@ -593,12 +602,39 @@
  "cohere-command-r-plus": {
    "description": "Command R+ es un modelo optimizado para RAG de última generación diseñado para abordar cargas de trabajo de nivel empresarial."
  },
+  "command": {
+    "description": "Un modelo de conversación que sigue instrucciones, ofreciendo alta calidad y fiabilidad en tareas lingüísticas, además de tener una longitud de contexto más larga que nuestros modelos de generación básicos."
+  },
+  "command-a-03-2025": {
+    "description": "Command A es nuestro modelo más potente hasta la fecha, destacando en el uso de herramientas, agentes, generación aumentada por recuperación (RAG) y aplicaciones multilingües. Command A tiene una longitud de contexto de 256K, puede ejecutarse con solo dos GPU y ha mejorado su rendimiento en un 150% en comparación con Command R+ 08-2024."
+  },
+  "command-light": {
+    "description": "Una versión más pequeña y rápida de Command, casi igual de potente, pero más rápida."
+  },
+  "command-light-nightly": {
+    "description": "Para acortar el intervalo entre lanzamientos de versiones principales, hemos lanzado versiones nocturnas del modelo Command. Para la serie command-light, esta versión se llama command-light-nightly. Tenga en cuenta que command-light-nightly es la versión más reciente, experimental y (posiblemente) inestable. Las versiones nocturnas se actualizan regularmente sin previo aviso, por lo que no se recomienda su uso en entornos de producción."
+  },
+  "command-nightly": {
+    "description": "Para acortar el intervalo entre lanzamientos de versiones principales, hemos lanzado versiones nocturnas del modelo Command. Para la serie Command, esta versión se llama command-cightly. Tenga en cuenta que command-nightly es la versión más reciente, experimental y (posiblemente) inestable. Las versiones nocturnas se actualizan regularmente sin previo aviso, por lo que no se recomienda su uso en entornos de producción."
+  },
  "command-r": {
    "description": "Command R es un LLM optimizado para tareas de diálogo y contexto largo, especialmente adecuado para interacciones dinámicas y gestión del conocimiento."
  },
+  "command-r-03-2024": {
+    "description": "Command R es un modelo de conversación que sigue instrucciones, ofreciendo una mayor calidad y fiabilidad en tareas lingüísticas, además de tener una longitud de contexto más larga que los modelos anteriores. Se puede utilizar en flujos de trabajo complejos, como generación de código, generación aumentada por recuperación (RAG), uso de herramientas y agentes."
+  },
+  "command-r-08-2024": {
+    "description": "command-r-08-2024 es una versión actualizada del modelo Command R, lanzada en agosto de 2024."
+  },
  "command-r-plus": {
    "description": "Command R+ es un modelo de lenguaje de gran tamaño de alto rendimiento, diseñado para escenarios empresariales reales y aplicaciones complejas."
  },
+  "command-r-plus-04-2024": {
+    "description": "Command R+ es un modelo de conversación que sigue instrucciones, ofreciendo una mayor calidad y fiabilidad en tareas lingüísticas, además de tener una longitud de contexto más larga que los modelos anteriores. Es ideal para flujos de trabajo complejos de RAG y uso de herramientas en múltiples pasos."
+  },
+  "command-r7b-12-2024": {
+    "description": "command-r7b-12-2024 es una versión pequeña y eficiente, lanzada en diciembre de 2024. Destaca en tareas que requieren razonamiento complejo y procesamiento en múltiples pasos, como RAG, uso de herramientas y agentes."
+  },
  "dall-e-2": {
    "description": "El segundo modelo DALL·E, que admite generación de imágenes más realistas y precisas, con una resolución cuatro veces mayor que la de la primera generación."
  },
@@ -614,9 +650,6 @@
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": {
    "description": "El modelo de destilación DeepSeek-R1 optimiza el rendimiento de inferencia mediante aprendizaje por refuerzo y datos de arranque en frío, actualizando el estándar de múltiples tareas en modelos de código abierto."
  },
-  "deepseek-ai/DeepSeek-R1-Distill-Llama-8B": {
-    "description": "DeepSeek-R1-Distill-Llama-8B es un modelo de destilación desarrollado a partir de Llama-3.1-8B. Este modelo se ajustó utilizando muestras generadas por DeepSeek-R1, mostrando una excelente capacidad de inferencia. Ha tenido un buen desempeño en múltiples pruebas de referencia, alcanzando una precisión del 89.1% en MATH-500, una tasa de aprobación del 50.4% en AIME 2024, y una puntuación de 1205 en CodeForces, demostrando una fuerte capacidad matemática y de programación como modelo de 8B."
-  },
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": {
    "description": "El modelo de destilación DeepSeek-R1 optimiza el rendimiento de inferencia mediante aprendizaje por refuerzo y datos de arranque en frío, actualizando el estándar de múltiples tareas en modelos de código abierto."
  },
@@ -659,12 +692,30 @@
  "deepseek-r1": {
    "description": "DeepSeek-R1 es un modelo de inferencia impulsado por aprendizaje reforzado (RL) que aborda los problemas de repetitividad y legibilidad en el modelo. Antes de RL, DeepSeek-R1 introdujo datos de arranque en frío, optimizando aún más el rendimiento de la inferencia. Su desempeño en tareas matemáticas, de código e inferencia es comparable al de OpenAI-o1, y ha mejorado su efectividad general a través de métodos de entrenamiento cuidadosamente diseñados."
  },
+  "deepseek-r1-70b-fast-online": {
+    "description": "DeepSeek R1 70B versión rápida, que soporta búsqueda en línea en tiempo real, ofreciendo una velocidad de respuesta más rápida mientras mantiene el rendimiento del modelo."
+  },
+  "deepseek-r1-70b-online": {
+    "description": "DeepSeek R1 70B versión estándar, que soporta búsqueda en línea en tiempo real, adecuada para tareas de conversación y procesamiento de textos que requieren información actualizada."
+  },
+  "deepseek-r1-distill-llama": {
+    "description": "deepseek-r1-distill-llama es un modelo basado en Llama destilado a partir de DeepSeek-R1."
+  },
  "deepseek-r1-distill-llama-70b": {
    "description": "DeepSeek R1, el modelo más grande e inteligente del conjunto DeepSeek, ha sido destilado en la arquitectura Llama 70B. Basado en pruebas de referencia y evaluaciones humanas, este modelo es más inteligente que el Llama 70B original, destacándose especialmente en tareas que requieren precisión matemática y factual."
  },
  "deepseek-r1-distill-llama-8b": {
    "description": "El modelo de la serie DeepSeek-R1-Distill se obtiene mediante la técnica de destilación de conocimiento, ajustando muestras generadas por DeepSeek-R1 a modelos de código abierto como Qwen y Llama."
  },
+  "deepseek-r1-distill-qianfan-llama-70b": {
+    "description": "Lanzado por primera vez el 14 de febrero de 2025, destilado por el equipo de desarrollo del modelo Qianfan a partir del modelo base Llama3_70B (Construido con Meta Llama), con datos de destilación que también incluyen el corpus de Qianfan."
+  },
+  "deepseek-r1-distill-qianfan-llama-8b": {
+    "description": "Lanzado por primera vez el 14 de febrero de 2025, destilado por el equipo de desarrollo del modelo Qianfan a partir del modelo base Llama3_8B (Construido con Meta Llama), con datos de destilación que también incluyen el corpus de Qianfan."
+  },
+  "deepseek-r1-distill-qwen": {
+    "description": "deepseek-r1-distill-qwen es un modelo basado en Qwen destilado a partir de DeepSeek-R1."
+  },
  "deepseek-r1-distill-qwen-1.5b": {
    "description": "El modelo de la serie DeepSeek-R1-Distill se obtiene mediante la técnica de destilación de conocimiento, ajustando muestras generadas por DeepSeek-R1 a modelos de código abierto como Qwen y Llama."
  },
@@ -677,6 +728,12 @@
  "deepseek-r1-distill-qwen-7b": {
    "description": "El modelo de la serie DeepSeek-R1-Distill se obtiene mediante la técnica de destilación de conocimiento, ajustando muestras generadas por DeepSeek-R1 a modelos de código abierto como Qwen y Llama."
  },
+  "deepseek-r1-fast-online": {
+    "description": "DeepSeek R1 versión rápida completa, que soporta búsqueda en línea en tiempo real, combinando la potente capacidad de 671B de parámetros con una velocidad de respuesta más rápida."
+  },
+  "deepseek-r1-online": {
+    "description": "DeepSeek R1 versión completa, con 671B de parámetros, que soporta búsqueda en línea en tiempo real, con una capacidad de comprensión y generación más potente."
+  },
  "deepseek-reasoner": {
    "description": "Modelo de inferencia lanzado por DeepSeek. Antes de proporcionar la respuesta final, el modelo genera primero una cadena de pensamiento para mejorar la precisión de la respuesta final."
  },
@@ -689,6 +746,9 @@
  "deepseek-v3": {
    "description": "DeepSeek-V3 es un modelo MoE desarrollado por Hangzhou DeepSeek Artificial Intelligence Technology Research Co., Ltd., que ha destacado en múltiples evaluaciones, ocupando el primer lugar en la lista de modelos de código abierto. En comparación con el modelo V2.5, la velocidad de generación se ha incrementado tres veces, brindando a los usuarios una experiencia de uso más rápida y fluida."
  },
+  "deepseek-v3-0324": {
+    "description": "DeepSeek-V3-0324 es un modelo MoE de 671B parámetros, destacándose en habilidades de programación y técnicas, comprensión del contexto y procesamiento de textos largos."
+  },
  "deepseek/deepseek-chat": {
    "description": "Un nuevo modelo de código abierto que fusiona capacidades generales y de codificación, no solo conserva la capacidad de diálogo general del modelo Chat original y la potente capacidad de procesamiento de código del modelo Coder, sino que también se alinea mejor con las preferencias humanas. Además, DeepSeek-V2.5 ha logrado mejoras significativas en tareas de escritura, seguimiento de instrucciones y más."
  },
@@ -755,6 +815,9 @@
  "ernie-4.0-turbo-8k-preview": {
    "description": "El modelo de lenguaje grande de bandera de Baidu, desarrollado internamente, de ultra gran escala, muestra un rendimiento excepcional en general, siendo ampliamente aplicable en escenarios de tareas complejas en diversos campos; soporta la integración automática con el plugin de búsqueda de Baidu, garantizando la actualidad de la información de preguntas y respuestas. En comparación con ERNIE 4.0, presenta un rendimiento superior."
  },
+  "ernie-4.5-8k-preview": {
+    "description": "El modelo grande Wenxin 4.5 es un nuevo modelo base multimodal nativo desarrollado por Baidu, que logra una optimización colaborativa a través de modelado conjunto de múltiples modalidades, con excelentes capacidades de comprensión multimodal; presenta una capacidad lingüística más avanzada, con mejoras en comprensión, generación, lógica y memoria, así como una notable reducción de alucinaciones y mejoras en razonamiento lógico y capacidades de codificación."
+  },
  "ernie-char-8k": {
    "description": "Modelo de lenguaje grande de escenario vertical desarrollado internamente por Baidu, adecuado para aplicaciones como NPC de juegos, diálogos de servicio al cliente y juegos de rol de diálogos, con un estilo de personaje más distintivo y consistente, y una mayor capacidad de seguimiento de instrucciones y rendimiento de inferencia."
  },
@@ -788,9 +851,6 @@
  "gemini-1.0-pro-latest": {
    "description": "Gemini 1.0 Pro es el modelo de IA de alto rendimiento de Google, diseñado para la escalabilidad en una amplia gama de tareas."
  },
-  "gemini-1.5-flash": {
-    "description": "Gemini 1.5 Flash es el último modelo de IA multimodal de Google, que cuenta con una capacidad de procesamiento rápido, admite entradas de texto, imágenes y videos, y es adecuado para la escalabilidad eficiente en diversas tareas."
-  },
  "gemini-1.5-flash-001": {
    "description": "Gemini 1.5 Flash 001 es un modelo multimodal eficiente, que admite la escalabilidad para aplicaciones amplias."
  },
@@ -803,6 +863,9 @@
  "gemini-1.5-flash-8b-exp-0924": {
    "description": "Gemini 1.5 Flash 8B 0924 es el último modelo experimental, con mejoras significativas en el rendimiento tanto en casos de uso de texto como multimodal."
  },
+  "gemini-1.5-flash-8b-latest": {
+    "description": "Gemini 1.5 Flash 8B es un modelo multimodal eficiente que admite una amplia gama de aplicaciones escalables."
+  },
  "gemini-1.5-flash-exp-0827": {
    "description": "Gemini 1.5 Flash 0827 ofrece capacidades de procesamiento multimodal optimizadas, adecuadas para diversas tareas complejas."
  },
@@ -830,24 +893,27 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash ofrece funciones y mejoras de próxima generación, incluyendo velocidad excepcional, uso de herramientas nativas, generación multimodal y una ventana de contexto de 1M tokens."
  },
+  "gemini-2.0-flash-exp": {
+    "description": "Variante del modelo Gemini 2.0 Flash, optimizada para objetivos como la rentabilidad y la baja latencia."
+  },
+  "gemini-2.0-flash-exp-image-generation": {
+    "description": "Modelo experimental Gemini 2.0 Flash, que admite la generación de imágenes"
+  },
  "gemini-2.0-flash-lite": {
    "description": "Variante del modelo Gemini 2.0 Flash, optimizada para objetivos como la rentabilidad y la baja latencia."
  },
  "gemini-2.0-flash-lite-001": {
    "description": "Variante del modelo Gemini 2.0 Flash, optimizada para objetivos como la rentabilidad y la baja latencia."
  },
-  "gemini-2.0-flash-lite-preview-02-05": {
-    "description": "Un modelo Gemini 2.0 Flash optimizado para objetivos de costo-efectividad y baja latencia."
-  },
-  "gemini-2.0-flash-thinking-exp": {
-    "description": "Gemini 2.0 Flash Exp es el último modelo experimental de IA multimodal de Google, con características de próxima generación, velocidad excepcional, llamadas nativas a herramientas y generación multimodal."
-  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp es el último modelo experimental de IA multimodal de Google, con características de próxima generación, velocidad excepcional, llamadas nativas a herramientas y generación multimodal."
  },
  "gemini-2.0-pro-exp-02-05": {
    "description": "Gemini 2.0 Pro Experimental es el último modelo de IA multimodal experimental de Google, con mejoras de calidad en comparación con versiones anteriores, especialmente en conocimiento del mundo, código y contextos largos."
  },
+  "gemini-2.5-pro-exp-03-25": {
+    "description": "Gemini 2.5 Pro Experimental es el modelo de pensamiento más avanzado de Google, capaz de razonar sobre problemas complejos en código, matemáticas y campos STEM, además de utilizar contextos largos para analizar grandes conjuntos de datos, bibliotecas de código y documentos."
+  },
  "gemma-7b-it": {
    "description": "Gemma 7B es adecuado para el procesamiento de tareas de pequeña y mediana escala, combinando rentabilidad."
  },
@@ -1016,6 +1082,9 @@
  "gpt-4o-mini-realtime-preview": {
    "description": "Versión en tiempo real de GPT-4o-mini, que admite entrada y salida de audio y texto en tiempo real."
  },
+  "gpt-4o-mini-tts": {
+    "description": "GPT-4o mini TTS es un modelo de texto a voz basado en GPT-4o mini, que ofrece generación de voz de alta calidad a un costo más bajo."
+  },
  "gpt-4o-realtime-preview": {
    "description": "Versión en tiempo real de GPT-4o, que admite entrada y salida de audio y texto en tiempo real."
  },
@@ -1073,6 +1142,12 @@
  "hunyuan-standard-vision": {
    "description": "El modelo multimodal más reciente de Hunyuan, que soporta respuestas en múltiples idiomas, con capacidades equilibradas en chino e inglés."
  },
+  "hunyuan-t1-20250321": {
+    "description": "Construye de manera integral las capacidades de modelos en ciencias exactas y humanidades, con una fuerte capacidad para capturar información de textos largos. Soporta la inferencia y respuesta a problemas científicos de diversas dificultades, incluyendo matemáticas, lógica, ciencias y código."
+  },
+  "hunyuan-t1-latest": {
+    "description": "El primer modelo de inferencia híbrido de gran escala Hybrid-Transformer-Mamba de la industria, que amplía la capacidad de inferencia, ofrece una velocidad de decodificación excepcional y alinea aún más con las preferencias humanas."
+  },
  "hunyuan-translation": {
    "description": "Soporta la traducción entre 15 idiomas, incluyendo chino, inglés, japonés, francés, portugués, español, turco, ruso, árabe, coreano, italiano, alemán, vietnamita, malayo e indonesio, con evaluación automatizada basada en el conjunto de evaluación de traducción en múltiples escenarios y puntuación COMET, superando en general a modelos de tamaño similar en la capacidad de traducción entre idiomas comunes."
  },
@@ -1082,9 +1157,6 @@
  "hunyuan-turbo": {
    "description": "Versión preliminar de la nueva generación del modelo de lenguaje de Hunyuan, que utiliza una nueva estructura de modelo de expertos mixtos (MoE), con una eficiencia de inferencia más rápida y un rendimiento más fuerte en comparación con Hunyuan-Pro."
  },
-  "hunyuan-turbo-20241120": {
-    "description": "Versión fija de hunyuan-turbo del 20 de noviembre de 2024, una versión intermedia entre hunyuan-turbo y hunyuan-turbo-latest."
-  },
  "hunyuan-turbo-20241223": {
    "description": "Optimización de esta versión: escalado de instrucciones de datos, mejora significativa de la capacidad de generalización del modelo; mejora significativa de las capacidades de matemáticas, código y razonamiento lógico; optimización de la comprensión de texto y de palabras relacionadas; optimización de la calidad de generación de contenido en la creación de texto."
  },
@@ -1094,6 +1166,15 @@
  "hunyuan-turbo-vision": {
    "description": "El nuevo modelo insignia de lenguaje visual de Hunyuan de nueva generación, que utiliza una nueva estructura de modelo de expertos mixtos (MoE), mejorando de manera integral las capacidades de reconocimiento básico, creación de contenido, preguntas y respuestas de conocimiento, y análisis y razonamiento en comparación con la generación anterior de modelos."
  },
+  "hunyuan-turbos-20250226": {
+    "description": "hunyuan-TurboS pv2.1.2 es una versión fija con un aumento en el número de tokens de entrenamiento; mejora en las capacidades de pensamiento en matemáticas/lógica/código; mejora en la experiencia general en chino e inglés, incluyendo creación de textos, comprensión de textos, preguntas y respuestas de conocimiento, y charlas informales."
+  },
+  "hunyuan-turbos-20250313": {
+    "description": "Unificación del estilo de pasos de resolución matemática, mejorando las preguntas y respuestas matemáticas en múltiples rondas. Optimización del estilo de respuesta en la creación de textos, eliminando el sabor a IA y aumentando la elegancia."
+  },
+  "hunyuan-turbos-latest": {
+    "description": "hunyuan-TurboS es la última versión del modelo insignia Hunyuan, con una mayor capacidad de pensamiento y una mejor experiencia."
+  },
  "hunyuan-vision": {
    "description": "El último modelo multimodal de Hunyuan, que admite la entrada de imágenes y texto para generar contenido textual."
  },
@@ -1124,12 +1205,18 @@
  "lite": {
    "description": "Spark Lite es un modelo de lenguaje grande y ligero, con una latencia extremadamente baja y una capacidad de procesamiento eficiente, completamente gratuito y de código abierto, que admite funciones de búsqueda en línea en tiempo real. Su característica de respuesta rápida lo hace destacar en aplicaciones de inferencia y ajuste de modelos en dispositivos de baja potencia, brindando a los usuarios una excelente relación costo-beneficio y experiencia inteligente, especialmente en escenarios de preguntas y respuestas, generación de contenido y búsqueda."
  },
+  "llama-2-7b-chat": {
+    "description": "Llama2 es una serie de modelos de lenguaje de gran escala (LLM) desarrollados y publicados por Meta, que incluye modelos de texto generativo preentrenados y ajustados de diferentes tamaños, desde 7 mil millones hasta 70 mil millones de parámetros. A nivel de arquitectura, Llama2 es un modelo de lenguaje autoregresivo que utiliza una arquitectura de transformador optimizada. Las versiones ajustadas utilizan un ajuste de fine-tuning supervisado (SFT) y aprendizaje por refuerzo con retroalimentación humana (RLHF) para alinear las preferencias de utilidad y seguridad humanas. Llama2 supera a la serie Llama en varios conjuntos de datos académicos, proporcionando ideas para el diseño y desarrollo de numerosos otros modelos."
+  },
  "llama-3.1-70b-versatile": {
    "description": "Llama 3.1 70B ofrece una capacidad de razonamiento AI más potente, adecuada para aplicaciones complejas, soportando un procesamiento computacional extenso y garantizando eficiencia y precisión."
  },
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B es un modelo de alto rendimiento que ofrece una rápida capacidad de generación de texto, ideal para aplicaciones que requieren eficiencia a gran escala y rentabilidad."
  },
+  "llama-3.1-instruct": {
+    "description": "El modelo Llama 3.1 ajustado para instrucciones está optimizado para escenarios de conversación, superando a muchos modelos de chat de código abierto existentes en pruebas de referencia comunes de la industria."
+  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Capacidad excepcional de razonamiento visual en imágenes de alta resolución, adecuada para aplicaciones de comprensión visual."
  },
@@ -1142,12 +1229,18 @@
  "llama-3.2-90b-vision-preview": {
    "description": "Llama 3.2 está diseñado para manejar tareas que combinan datos visuales y textuales. Destaca en tareas como la descripción de imágenes y preguntas visuales, cruzando la brecha entre la generación de lenguaje y el razonamiento visual."
  },
+  "llama-3.2-vision-instruct": {
+    "description": "El modelo Llama 3.2-Vision con ajuste fino de instrucciones está optimizado para reconocimiento visual, razonamiento sobre imágenes, descripción de imágenes y respuesta a preguntas generales relacionadas con imágenes."
+  },
  "llama-3.3-70b-instruct": {
    "description": "Llama 3.3 es el modelo de lenguaje de código abierto multilingüe más avanzado de la serie Llama, que ofrece un rendimiento comparable al modelo de 405B a un costo extremadamente bajo. Basado en la estructura Transformer, y mejorado en utilidad y seguridad a través de ajuste fino supervisado (SFT) y aprendizaje por refuerzo con retroalimentación humana (RLHF). Su versión ajustada para instrucciones está optimizada para diálogos multilingües, superando a muchos modelos de chat de código abierto y cerrado en múltiples benchmarks de la industria. La fecha límite de conocimiento es diciembre de 2023."
  },
  "llama-3.3-70b-versatile": {
    "description": "El modelo de lenguaje multilingüe Meta Llama 3.3 (LLM) es un modelo generativo preentrenado y ajustado para instrucciones de 70B (entrada/salida de texto). El modelo de texto puro ajustado para instrucciones de Llama 3.3 está optimizado para casos de uso de conversación multilingüe y supera a muchos modelos de chat de código abierto y cerrado en benchmarks industriales comunes."
  },
+  "llama-3.3-instruct": {
+    "description": "El modelo de instrucción Llama 3.3, optimizado para escenarios de diálogo, supera a muchos modelos de chat de código abierto existentes en pruebas de referencia comunes de la industria."
+  },
  "llama3-70b-8192": {
    "description": "Meta Llama 3 70B proporciona una capacidad de procesamiento de complejidad inigualable, diseñado a medida para proyectos de alta demanda."
  },
@@ -1187,6 +1280,9 @@
  "max-32k": {
    "description": "Spark Max 32K está equipado con una capacidad de procesamiento de contexto grande, con una comprensión contextual más fuerte y habilidades de razonamiento lógico, soportando entradas de texto de 32K tokens, adecuado para la lectura de documentos largos, preguntas y respuestas de conocimiento privado y otros escenarios."
  },
+  "megrez-3b-instruct": {
+    "description": "Megrez-3B-Instruct es un modelo de lenguaje grande entrenado completamente de forma autónoma por Wúwèn Xīnqióng. Megrez-3B-Instruct tiene como objetivo crear una solución de inteligencia periférica rápida, compacta y fácil de usar, basada en el concepto de colaboración entre hardware y software."
+  },
  "meta-llama-3-70b-instruct": {
    "description": "Un poderoso modelo de 70 mil millones de parámetros que sobresale en razonamiento, codificación y amplias aplicaciones de lenguaje."
  },
@@ -1223,9 +1319,6 @@
  "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": {
    "description": "LLaMA 3.2 está diseñado para manejar tareas que combinan datos visuales y textuales. Se destaca en tareas como descripción de imágenes y preguntas visuales, cruzando la brecha entre la generación de lenguaje y el razonamiento visual."
  },
-  "meta-llama/Llama-3.3-70B-Instruct": {
-    "description": "Llama 3.3 es el modelo de lenguaje de código abierto multilingüe más avanzado de la serie Llama, que ofrece un rendimiento comparable al modelo de 405B a un costo muy bajo. Basado en la estructura Transformer, y mejorado en utilidad y seguridad a través de ajuste fino supervisado (SFT) y aprendizaje por refuerzo con retroalimentación humana (RLHF). Su versión ajustada por instrucciones está optimizada para diálogos multilingües, superando a muchos modelos de chat de código abierto y cerrado en múltiples benchmarks de la industria. La fecha de corte de conocimiento es diciembre de 2023."
-  },
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
    "description": "El modelo de lenguaje grande multilingüe Meta Llama 3.3 (LLM) es un modelo generativo preentrenado y ajustado por instrucciones de 70B (entrada de texto/salida de texto). El modelo de texto puro ajustado por instrucciones de Llama 3.3 está optimizado para casos de uso de diálogo multilingüe y supera a muchos modelos de chat de código abierto y cerrados en benchmarks de la industria."
  },
@@ -1253,15 +1346,9 @@
  "meta-llama/Meta-Llama-3.1-70B": {
    "description": "Llama 3.1 es el modelo líder lanzado por Meta, que soporta hasta 405B de parámetros, aplicable en diálogos complejos, traducción multilingüe y análisis de datos."
  },
-  "meta-llama/Meta-Llama-3.1-70B-Instruct": {
-    "description": "LLaMA 3.1 70B proporciona soporte de conversación eficiente en múltiples idiomas."
-  },
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
    "description": "El modelo Llama 3.1 70B está finamente ajustado para aplicaciones de alta carga, cuantificado a FP8 para ofrecer una capacidad de cálculo y precisión más eficientes, asegurando un rendimiento excepcional en escenarios complejos."
  },
-  "meta-llama/Meta-Llama-3.1-8B-Instruct": {
-    "description": "LLaMA 3.1 ofrece soporte multilingüe y es uno de los modelos generativos líderes en la industria."
-  },
  "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
    "description": "El modelo Llama 3.1 8B utiliza cuantificación FP8, soportando hasta 131,072 tokens de contexto, destacándose entre los modelos de código abierto, ideal para tareas complejas y superando muchos estándares de la industria."
  },
@@ -1355,12 +1442,18 @@
  "mistral-large": {
    "description": "Mixtral Large es el modelo insignia de Mistral, combinando capacidades de generación de código, matemáticas y razonamiento, soportando una ventana de contexto de 128k."
  },
+  "mistral-large-instruct": {
+    "description": "Mistral-Large-Instruct-2407 es un modelo avanzado de lenguaje denso (LLM) con 123 mil millones de parámetros, que posee capacidades de razonamiento, conocimiento y codificación de última generación."
+  },
  "mistral-large-latest": {
    "description": "Mistral Large es el modelo insignia, especializado en tareas multilingües, razonamiento complejo y generación de código, ideal para aplicaciones de alta gama."
  },
  "mistral-nemo": {
    "description": "Mistral Nemo, desarrollado en colaboración entre Mistral AI y NVIDIA, es un modelo de 12B de alto rendimiento."
  },
+  "mistral-nemo-instruct": {
+    "description": "Mistral-Nemo-Instruct-2407 es un modelo de lenguaje grande (LLM) que es una versión ajustada por instrucciones de Mistral-Nemo-Base-2407."
+  },
  "mistral-small": {
    "description": "Mistral Small se puede utilizar en cualquier tarea basada en lenguaje que requiera alta eficiencia y baja latencia."
  },
@@ -1577,6 +1670,12 @@
  "qwen2": {
    "description": "Qwen2 es el nuevo modelo de lenguaje a gran escala de Alibaba, que ofrece un rendimiento excepcional para satisfacer diversas necesidades de aplicación."
  },
+  "qwen2-72b-instruct": {
+    "description": "Qwen2 es la nueva serie de modelos de lenguaje de gran escala presentada por el equipo de Qwen. Se basa en la arquitectura Transformer y utiliza funciones de activación SwiGLU, sesgo de atención QKV (attention QKV bias), atención de consulta grupal (group query attention), una mezcla de atención de ventana deslizante y atención completa (mixture of sliding window attention and full attention). Además, el equipo de Qwen ha mejorado el tokenizador para adaptarse a múltiples lenguajes naturales y códigos."
+  },
+  "qwen2-7b-instruct": {
+    "description": "Qwen2 es una nueva serie de modelos de lenguaje de gran escala desarrollada por el equipo de Qwen. Se basa en la arquitectura Transformer y utiliza funciones de activación SwiGLU, sesgo de atención QKV (attention QKV bias), atención de consulta grupal (group query attention), una mezcla de atención de ventana deslizante y atención completa (mixture of sliding window attention and full attention). Además, el equipo de Qwen ha mejorado el tokenizador para adaptarse a múltiples lenguajes naturales y códigos."
+  },
  "qwen2.5": {
    "description": "Qwen2.5 es la nueva generación de modelos de lenguaje a gran escala de Alibaba, que ofrece un rendimiento excepcional para satisfacer diversas necesidades de aplicación."
  },
@@ -1604,6 +1703,12 @@
  "qwen2.5-coder-7b-instruct": {
    "description": "La versión de código abierto del modelo de código Tongyi Qwen."
  },
+  "qwen2.5-coder-instruct": {
+    "description": "Qwen2.5-Coder es el modelo de lenguaje de gran tamaño más reciente de la serie Qwen especializado en código (anteriormente conocido como CodeQwen)."
+  },
+  "qwen2.5-instruct": {
+    "description": "Qwen2.5 es la última serie de modelos de lenguaje extenso Qwen. Para Qwen2.5, hemos lanzado varios modelos de lenguaje base y modelos de lenguaje ajustados por instrucciones, con parámetros que van desde 500 millones hasta 7.2 mil millones."
+  },
  "qwen2.5-math-1.5b-instruct": {
    "description": "El modelo Qwen-Math tiene habilidades poderosas para resolver problemas matemáticos."
  },
@@ -1613,12 +1718,21 @@
  "qwen2.5-math-7b-instruct": {
    "description": "El modelo Qwen-Math tiene una poderosa capacidad para resolver problemas matemáticos."
  },
+  "qwen2.5-omni-7b": {
+    "description": "La serie de modelos Qwen-Omni admite la entrada de datos de múltiples modalidades, incluyendo video, audio, imágenes y texto, y produce audio y texto como salida."
+  },
+  "qwen2.5-vl-32b-instruct": {
+    "description": "La serie de modelos Qwen2.5-VL ha mejorado el nivel de inteligencia, utilidad y aplicabilidad del modelo, optimizando su rendimiento en escenarios como conversaciones naturales, creación de contenido, servicios de conocimiento especializado y desarrollo de código. La versión 32B utiliza técnicas de aprendizaje por refuerzo para optimizar el modelo, ofreciendo en comparación con otros modelos de la serie Qwen2.5 VL, un estilo de salida más acorde con las preferencias humanas, capacidad de razonamiento para problemas matemáticos complejos, así como comprensión y razonamiento detallado de imágenes."
+  },
  "qwen2.5-vl-72b-instruct": {
    "description": "Mejora general en seguimiento de instrucciones, matemáticas, resolución de problemas y código, con capacidades de reconocimiento de objetos mejoradas, soporta formatos diversos para localizar elementos visuales con precisión, y puede entender archivos de video largos (hasta 10 minutos) y localizar eventos en segundos, comprendiendo la secuencia y velocidad del tiempo, soportando el control de agentes en OS o móviles, con fuerte capacidad de extracción de información clave y salida en formato Json. Esta versión es la de 72B, la más potente de la serie."
  },
  "qwen2.5-vl-7b-instruct": {
    "description": "Mejora general en seguimiento de instrucciones, matemáticas, resolución de problemas y código, con capacidades de reconocimiento de objetos mejoradas, soporta formatos diversos para localizar elementos visuales con precisión, y puede entender archivos de video largos (hasta 10 minutos) y localizar eventos en segundos, comprendiendo la secuencia y velocidad del tiempo, soportando el control de agentes en OS o móviles, con fuerte capacidad de extracción de información clave y salida en formato Json. Esta versión es la de 72B, la más potente de la serie."
  },
+  "qwen2.5-vl-instruct": {
+    "description": "Qwen2.5-VL es la última versión del modelo de lenguaje visual de la familia de modelos Qwen."
+  },
  "qwen2.5:0.5b": {
    "description": "Qwen2.5 es la nueva generación de modelos de lenguaje a gran escala de Alibaba, que ofrece un rendimiento excepcional para satisfacer diversas necesidades de aplicación."
  },
@@ -1754,6 +1868,9 @@
  "wizardlm2:8x22b": {
    "description": "WizardLM 2 es un modelo de lenguaje proporcionado por Microsoft AI, que destaca en diálogos complejos, multilingües, razonamiento y asistentes inteligentes."
  },
+  "yi-1.5-34b-chat": {
+    "description": "Yi-1.5 es una versión mejorada de Yi. Utiliza un corpus de alta calidad de 500B tokens para continuar el preentrenamiento de Yi y se微调 en 3M muestras de ajuste fino diversificadas."
+  },
  "yi-large": {
    "description": "Modelo de mil millones de parámetros completamente nuevo, que ofrece capacidades excepcionales de preguntas y respuestas y generación de texto."
  },
@@ -23,6 +23,9 @@
  "cloudflare": {
    "description": "Ejecuta modelos de aprendizaje automático impulsados por GPU sin servidor en la red global de Cloudflare."
  },
+  "cohere": {
+    "description": "Cohere le ofrece los modelos multilingües más avanzados, potentes funciones de búsqueda y un espacio de trabajo de IA diseñado a medida para empresas modernas, todo integrado en una plataforma segura."
+  },
  "deepseek": {
    "description": "DeepSeek es una empresa centrada en la investigación y aplicación de tecnologías de inteligencia artificial, cuyo modelo más reciente, DeepSeek-V2.5, combina capacidades de diálogo general y procesamiento de código, logrando mejoras significativas en alineación con preferencias humanas, tareas de escritura y seguimiento de instrucciones."
  },
@@ -53,6 +56,9 @@
  "hunyuan": {
    "description": "Un modelo de lenguaje desarrollado por Tencent, que posee una poderosa capacidad de creación en chino, habilidades de razonamiento lógico en contextos complejos y una capacidad confiable para ejecutar tareas."
  },
+  "infiniai": {
+    "description": "Proporciona a los desarrolladores de aplicaciones servicios de modelos grandes de alto rendimiento, fáciles de usar y seguros, cubriendo todo el proceso desde el desarrollo de modelos grandes hasta su implementación como servicio."
+  },
  "internlm": {
    "description": "Organización de código abierto dedicada a la investigación y desarrollo de herramientas para modelos grandes. Proporciona a todos los desarrolladores de IA una plataforma de código abierto eficiente y fácil de usar, permitiendo el acceso a las tecnologías y algoritmos más avanzados."
  },
@@ -98,6 +104,9 @@
  "sambanova": {
    "description": "SambaNova Cloud permite a los desarrolladores utilizar fácilmente los mejores modelos de código abierto y disfrutar de la velocidad de inferencia más rápida."
  },
+  "search1api": {
+    "description": "Search1API proporciona acceso a la serie de modelos DeepSeek que se pueden conectar a Internet según sea necesario, incluyendo versiones estándar y rápidas, con soporte para la selección de modelos de diferentes escalas de parámetros."
+  },
  "sensenova": {
    "description": "SenseTime ofrece servicios de modelos grandes de pila completa, aprovechando el sólido soporte de la gran infraestructura de SenseTime."
  },
@@ -137,6 +146,9 @@
  "xai": {
    "description": "xAI es una empresa dedicada a construir inteligencia artificial para acelerar los descubrimientos científicos humanos. Nuestra misión es promover nuestra comprensión compartida del universo."
  },
+  "xinference": {
+    "description": "Xorbits Inference (Xinference) es una plataforma de código abierto diseñada para simplificar la ejecución e integración de diversos modelos de IA. Con Xinference, puedes utilizar cualquier modelo LLM de código abierto, modelos de incrustación y modelos multimodales para ejecutar inferencias en entornos locales o en la nube, y crear potentes aplicaciones de IA."
+  },
  "zeroone": {
    "description": "01.AI se centra en la tecnología de inteligencia artificial de la era 2.0, promoviendo enérgicamente la innovación y aplicación de 'humano + inteligencia artificial', utilizando modelos extremadamente potentes y tecnologías de IA avanzadas para mejorar la productividad humana y lograr el empoderamiento tecnológico."
  },
--- a/Show More
+++ b/Show More
				`@@ -0,0 +1 @@`
				`export const isDev = process.env.NODE_ENV === 'development';`