Merge branch 'main' into chore/try-react-compiler

📝 docs: Add NEXT_PUBLIC_ENABLE_NEXT_AUTH to clerk example (#6309 )
💄 style(chat): auto send message from URL (#6497 )
2026-06-20 06:15:58 +00:00 · 2025-03-09 19:06:06 +08:00 · 2025-03-09 19:05:37 +08:00 · 2025-03-09 19:01:59 +08:00 · 2025-03-09 19:00:22 +08:00 · 2025-03-09 18:57:50 +08:00
404 changed files with 21186 additions and 3659 deletions
@@ -6,7 +6,7 @@


 ########################################
-######## Model Provider Service ########
+########## AI Provider Service #########
 ########################################

 ### OpenAI ###
@@ -33,7 +33,7 @@ OPENAI_API_KEY=sk-xxxxxxxxx
 # AZURE_ENDPOINT=https://docs-test-001.openai.azure.com

 # Azure's API version, follows the YYYY-MM-DD format
-# AZURE_API_VERSION=2024-06-01
+# AZURE_API_VERSION=2024-10-21


 ### Anthropic Service ####
@@ -127,6 +127,10 @@ OPENAI_API_KEY=sk-xxxxxxxxx

 # TENCENT_CLOUD_API_KEY=sk-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx

+### PPIO ####
+
+# PPIO_API_KEY=sk-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx
+
 ########################################
 ############ Market Service ############
 ########################################
@@ -214,7 +218,7 @@ OPENAI_API_KEY=sk-xxxxxxxxx
 # DATABASE_URL=postgres://username:password@host:port/database

 # use `openssl rand -base64 32` to generate a key for the encryption of the database
-# we use this key to encrypt the user api key
+# we use this key to encrypt the user api key and proxy url
 #KEY_VAULTS_SECRET=xxxxx/xxxxxxxxxxxxxx=

 # Specify the Embedding model and Reranker model(unImplemented)
@@ -2,6 +2,733 @@

 # Changelog

+### [Version 1.69.4](https://github.com/lobehub/lobe-chat/compare/v1.69.3...v1.69.4)
+
+<sup>Released on **2025-03-09**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix mistral can not chat.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix mistral can not chat, closes [#6828](https://github.com/lobehub/lobe-chat/issues/6828) ([00cba71](https://github.com/lobehub/lobe-chat/commit/00cba71))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.69.3](https://github.com/lobehub/lobe-chat/compare/v1.69.2...v1.69.3)
+
+<sup>Released on **2025-03-08**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add login ui for next-auth.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add login ui for next-auth, closes [#6434](https://github.com/lobehub/lobe-chat/issues/6434) ([541f275](https://github.com/lobehub/lobe-chat/commit/541f275))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.69.2](https://github.com/lobehub/lobe-chat/compare/v1.69.1...v1.69.2)
+
+<sup>Released on **2025-03-07**</sup>
+
+#### ♻ Code Refactoring
+
+- **misc**: Refactor the agent runtime implement.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Code refactoring
+
+- **misc**: Refactor the agent runtime implement, closes [#6784](https://github.com/lobehub/lobe-chat/issues/6784) ([14a9874](https://github.com/lobehub/lobe-chat/commit/14a9874))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.69.1](https://github.com/lobehub/lobe-chat/compare/v1.69.0...v1.69.1)
+
+<sup>Released on **2025-03-07**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add Qwen QwQ model.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add Qwen QwQ model, closes [#6783](https://github.com/lobehub/lobe-chat/issues/6783) ([3d3c2ce](https://github.com/lobehub/lobe-chat/commit/3d3c2ce))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+## [Version 1.69.0](https://github.com/lobehub/lobe-chat/compare/v1.68.11...v1.69.0)
+
+<sup>Released on **2025-03-07**</sup>
+
+#### ✨ Features
+
+- **misc**: Support Anthropic Context Caching.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's improved
+
+- **misc**: Support Anthropic Context Caching, closes [#6704](https://github.com/lobehub/lobe-chat/issues/6704) ([471e3ed](https://github.com/lobehub/lobe-chat/commit/471e3ed))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.11](https://github.com/lobehub/lobe-chat/compare/v1.68.10...v1.68.11)
+
+<sup>Released on **2025-03-07**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add Gemini 2.0 Flash model variations, add QwQ models.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add Gemini 2.0 Flash model variations, closes [#6679](https://github.com/lobehub/lobe-chat/issues/6679) ([d5a8fcb](https://github.com/lobehub/lobe-chat/commit/d5a8fcb))
+- **misc**: Add QwQ models, closes [#6770](https://github.com/lobehub/lobe-chat/issues/6770) ([cd30fcc](https://github.com/lobehub/lobe-chat/commit/cd30fcc))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.10](https://github.com/lobehub/lobe-chat/compare/v1.68.9...v1.68.10)
+
+<sup>Released on **2025-03-06**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix litellm streaming usage and refactor the usage chunk.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix litellm streaming usage and refactor the usage chunk, closes [#6734](https://github.com/lobehub/lobe-chat/issues/6734) ([9f09952](https://github.com/lobehub/lobe-chat/commit/9f09952))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.9](https://github.com/lobehub/lobe-chat/compare/v1.68.8...v1.68.9)
+
+<sup>Released on **2025-03-05**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add epub file chunk split support.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add epub file chunk split support, closes [#6317](https://github.com/lobehub/lobe-chat/issues/6317) ([a79ab7a](https://github.com/lobehub/lobe-chat/commit/a79ab7a))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.8](https://github.com/lobehub/lobe-chat/compare/v1.68.7...v1.68.8)
+
+<sup>Released on **2025-03-05**</sup>
+
+#### 💄 Styles
+
+- **misc**: Improve openrouter models info.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Improve openrouter models info, closes [#6708](https://github.com/lobehub/lobe-chat/issues/6708) ([5693e68](https://github.com/lobehub/lobe-chat/commit/5693e68))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.7](https://github.com/lobehub/lobe-chat/compare/v1.68.6...v1.68.7)
+
+<sup>Released on **2025-03-05**</sup>
+
+#### ♻ Code Refactoring
+
+- **misc**: Refactor agent runtime to better code format.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Code refactoring
+
+- **misc**: Refactor agent runtime to better code format, closes [#6284](https://github.com/lobehub/lobe-chat/issues/6284) ([fc1ed4a](https://github.com/lobehub/lobe-chat/commit/fc1ed4a))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.6](https://github.com/lobehub/lobe-chat/compare/v1.68.5...v1.68.6)
+
+<sup>Released on **2025-03-05**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix custom ai provider sdk type.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix custom ai provider sdk type, closes [#6712](https://github.com/lobehub/lobe-chat/issues/6712) ([7f8c379](https://github.com/lobehub/lobe-chat/commit/7f8c379))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.5](https://github.com/lobehub/lobe-chat/compare/v1.68.4...v1.68.5)
+
+<sup>Released on **2025-03-04**</sup>
+
+#### 💄 Styles
+
+- **misc**: Fix provider order.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Fix provider order, closes [#6702](https://github.com/lobehub/lobe-chat/issues/6702) ([27e4980](https://github.com/lobehub/lobe-chat/commit/27e4980))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.4](https://github.com/lobehub/lobe-chat/compare/v1.68.3...v1.68.4)
+
+<sup>Released on **2025-03-04**</sup>
+
+#### 💄 Styles
+
+- **misc**: Support to show token usages.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Support to show token usages, closes [#6693](https://github.com/lobehub/lobe-chat/issues/6693) ([71a638e](https://github.com/lobehub/lobe-chat/commit/71a638e))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.3](https://github.com/lobehub/lobe-chat/compare/v1.68.2...v1.68.3)
+
+<sup>Released on **2025-03-03**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Improve url rules.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Improve url rules, closes [#6669](https://github.com/lobehub/lobe-chat/issues/6669) ([5ee59e3](https://github.com/lobehub/lobe-chat/commit/5ee59e3))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.2](https://github.com/lobehub/lobe-chat/compare/v1.68.1...v1.68.2)
+
+<sup>Released on **2025-03-03**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add build-in web search support for Wenxin & Hunyuan.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add build-in web search support for Wenxin & Hunyuan, closes [#6617](https://github.com/lobehub/lobe-chat/issues/6617) ([dfd1f09](https://github.com/lobehub/lobe-chat/commit/dfd1f09))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.68.1](https://github.com/lobehub/lobe-chat/compare/v1.68.0...v1.68.1)
+
+<sup>Released on **2025-03-03**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix page crash with crawler error.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix page crash with crawler error, closes [#6662](https://github.com/lobehub/lobe-chat/issues/6662) ([0c24251](https://github.com/lobehub/lobe-chat/commit/0c24251))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+## [Version 1.68.0](https://github.com/lobehub/lobe-chat/compare/v1.67.2...v1.68.0)
+
+<sup>Released on **2025-03-03**</sup>
+
+#### ✨ Features
+
+- **misc**: Add new model provider PPIO.
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix search web-browsing display bug.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's improved
+
+- **misc**: Add new model provider PPIO, closes [#6133](https://github.com/lobehub/lobe-chat/issues/6133) ([23a3fda](https://github.com/lobehub/lobe-chat/commit/23a3fda))
+
+#### What's fixed
+
+- **misc**: Fix search web-browsing display bug, closes [#6653](https://github.com/lobehub/lobe-chat/issues/6653) ([f472643](https://github.com/lobehub/lobe-chat/commit/f472643))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.67.2](https://github.com/lobehub/lobe-chat/compare/v1.67.1...v1.67.2)
+
+<sup>Released on **2025-03-02**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Improve some crawl case.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Improve some crawl case, closes [#6634](https://github.com/lobehub/lobe-chat/issues/6634) ([d38ab02](https://github.com/lobehub/lobe-chat/commit/d38ab02))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.67.1](https://github.com/lobehub/lobe-chat/compare/v1.67.0...v1.67.1)
+
+<sup>Released on **2025-03-02**</sup>
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+## [Version 1.67.0](https://github.com/lobehub/lobe-chat/compare/v1.66.6...v1.67.0)
+
+<sup>Released on **2025-03-02**</sup>
+
+#### ✨ Features
+
+- **misc**: Support web page crawl in the search.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's improved
+
+- **misc**: Support web page crawl in the search, closes [#6582](https://github.com/lobehub/lobe-chat/issues/6582) ([5e02602](https://github.com/lobehub/lobe-chat/commit/5e02602))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.6](https://github.com/lobehub/lobe-chat/compare/v1.66.5...v1.66.6)
+
+<sup>Released on **2025-03-02**</sup>
+
+#### 💄 Styles
+
+- **misc**: Add `gpt-4.5-preview` for OpenAI.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Add `gpt-4.5-preview` for OpenAI, closes [#6618](https://github.com/lobehub/lobe-chat/issues/6618) ([3ec3af0](https://github.com/lobehub/lobe-chat/commit/3ec3af0))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.5](https://github.com/lobehub/lobe-chat/compare/v1.66.4...v1.66.5)
+
+<sup>Released on **2025-02-28**</sup>
+
+#### 💄 Styles
+
+- **misc**: Improve portal style.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Improve portal style, closes [#6588](https://github.com/lobehub/lobe-chat/issues/6588) ([55b5416](https://github.com/lobehub/lobe-chat/commit/55b5416))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.4](https://github.com/lobehub/lobe-chat/compare/v1.66.3...v1.66.4)
+
+<sup>Released on **2025-02-28**</sup>
+
+#### 💄 Styles
+
+- **misc**: Optimize smooth output.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Optimize smooth output, closes [#5824](https://github.com/lobehub/lobe-chat/issues/5824) ([7a84ad9](https://github.com/lobehub/lobe-chat/commit/7a84ad9))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.3](https://github.com/lobehub/lobe-chat/compare/v1.66.2...v1.66.3)
+
+<sup>Released on **2025-02-27**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix fetch assistants plugin error.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix fetch assistants plugin error, closes [#6576](https://github.com/lobehub/lobe-chat/issues/6576) ([9669a02](https://github.com/lobehub/lobe-chat/commit/9669a02))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.2](https://github.com/lobehub/lobe-chat/compare/v1.66.1...v1.66.2)
+
+<sup>Released on **2025-02-27**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Update Claude sonnet 3.7 model ID.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Update Claude sonnet 3.7 model ID, closes [#6567](https://github.com/lobehub/lobe-chat/issues/6567) ([d1039d6](https://github.com/lobehub/lobe-chat/commit/d1039d6))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.66.1](https://github.com/lobehub/lobe-chat/compare/v1.66.0...v1.66.1)
+
+<sup>Released on **2025-02-27**</sup>
+
+#### 💄 Styles
+
+- **misc**: Added eu-central-1 region for bedrock.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Added eu-central-1 region for bedrock, closes [#6555](https://github.com/lobehub/lobe-chat/issues/6555) ([6f1e599](https://github.com/lobehub/lobe-chat/commit/6f1e599))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+## [Version 1.66.0](https://github.com/lobehub/lobe-chat/compare/v1.65.2...v1.66.0)
+
+<sup>Released on **2025-02-27**</sup>
+
+#### ✨ Features
+
+- **misc**: Add online search support for available providers.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's improved
+
+- **misc**: Add online search support for available providers, closes [#6475](https://github.com/lobehub/lobe-chat/issues/6475) ([cb0a3bc](https://github.com/lobehub/lobe-chat/commit/cb0a3bc))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.65.2](https://github.com/lobehub/lobe-chat/compare/v1.65.1...v1.65.2)
+
+<sup>Released on **2025-02-27**</sup>
+
+#### 💄 Styles
+
+- **misc**: Support parsing the search flag when parsing the model list, Update Gemini & Qwen models.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### Styles
+
+- **misc**: Support parsing the search flag when parsing the model list, closes [#6546](https://github.com/lobehub/lobe-chat/issues/6546) ([8c768ed](https://github.com/lobehub/lobe-chat/commit/8c768ed))
+- **misc**: Update Gemini & Qwen models, closes [#6531](https://github.com/lobehub/lobe-chat/issues/6531) ([efde928](https://github.com/lobehub/lobe-chat/commit/efde928))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
+### [Version 1.65.1](https://github.com/lobehub/lobe-chat/compare/v1.65.0...v1.65.1)
+
+<sup>Released on **2025-02-26**</sup>
+
+#### 🐛 Bug Fixes
+
+- **misc**: Fix claude 3.7 sonnet thinking with tool use.
+
+<br/>
+
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+
+#### What's fixed
+
+- **misc**: Fix claude 3.7 sonnet thinking with tool use, closes [#6528](https://github.com/lobehub/lobe-chat/issues/6528) ([a76d2bf](https://github.com/lobehub/lobe-chat/commit/a76d2bf))
+
+</details>
+
+<div align="right">
+
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+</div>
+
 ## [Version 1.65.0](https://github.com/lobehub/lobe-chat/compare/v1.64.3...v1.65.0)

 <sup>Released on **2025-02-25**</sup>
@@ -67,8 +67,9 @@ ENV NODE_OPTIONS="--max-old-space-size=8192"

 WORKDIR /app

-COPY package.json ./
+COPY package.json pnpm-workspace.yaml ./
 COPY .npmrc ./
+COPY packages ./packages

 RUN \
    # If you want to build docker in China, build with --build-arg USE_CN_MIRROR=true
@@ -86,10 +87,7 @@ RUN \
    # Use pnpm for corepack
    && corepack use $(sed -n 's/.*"packageManager": "\(.*\)".*/\1/p' package.json) \
    # Install the dependencies
-    && pnpm i \
-    # Add sharp dependencies
-    && mkdir -p /deps \
-    && pnpm add sharp --prefix /deps
+    && pnpm i

 COPY . .

@@ -101,13 +99,9 @@ FROM busybox:latest AS app

 COPY --from=base /distroless/ /

-COPY --from=builder /app/public /app/public
-
 # Automatically leverage output traces to reduce image size
 # https://nextjs.org/docs/advanced-features/output-file-tracing
 COPY --from=builder /app/.next/standalone /app/
-COPY --from=builder /app/.next/static /app/.next/static
-COPY --from=builder /deps/node_modules/.pnpm /app/node_modules/.pnpm

 # Copy server launcher
 COPY --from=builder /app/scripts/serverLauncher/startServer.js /app/startServer.js
@@ -203,6 +197,8 @@ ENV \
    OPENROUTER_API_KEY="" OPENROUTER_MODEL_LIST="" \
    # Perplexity
    PERPLEXITY_API_KEY="" PERPLEXITY_MODEL_LIST="" PERPLEXITY_PROXY_URL="" \
+    # PPIO
+    PPIO_API_KEY="" PPIO_MODEL_LIST="" \
    # Qwen
    QWEN_API_KEY="" QWEN_MODEL_LIST="" QWEN_PROXY_URL="" \
    # SambaNova
@@ -76,8 +76,9 @@ ENV NODE_OPTIONS="--max-old-space-size=8192"

 WORKDIR /app

-COPY package.json ./
+COPY package.json pnpm-workspace.yaml ./
 COPY .npmrc ./
+COPY packages ./packages

 RUN \
    # If you want to build docker in China, build with --build-arg USE_CN_MIRROR=true
@@ -96,9 +97,11 @@ RUN \
    && corepack use $(sed -n 's/.*"packageManager": "\(.*\)".*/\1/p' package.json) \
    # Install the dependencies
    && pnpm i \
-    # Add sharp and db migration dependencies
+    # Add db migration dependencies
    && mkdir -p /deps \
-    && pnpm add sharp pg drizzle-orm --prefix /deps
+    && cd /deps \
+    && pnpm init \
+    && pnpm add pg drizzle-orm

 COPY . .

@@ -110,23 +113,20 @@ FROM busybox:latest AS app

 COPY --from=base /distroless/ /

-COPY --from=builder /app/public /app/public
-
 # Automatically leverage output traces to reduce image size
 # https://nextjs.org/docs/advanced-features/output-file-tracing
 COPY --from=builder /app/.next/standalone /app/
-COPY --from=builder /app/.next/static /app/.next/static
-
-# copy dependencies
-COPY --from=builder /deps/node_modules/.pnpm /app/node_modules/.pnpm
-COPY --from=builder /deps/node_modules/pg /app/node_modules/pg
-COPY --from=builder /deps/node_modules/drizzle-orm /app/node_modules/drizzle-orm

 # Copy database migrations
 COPY --from=builder /app/src/database/migrations /app/migrations
 COPY --from=builder /app/scripts/migrateServerDB/docker.cjs /app/docker.cjs
 COPY --from=builder /app/scripts/migrateServerDB/errorHint.js /app/errorHint.js

+# copy dependencies
+COPY --from=builder /deps/node_modules/.pnpm /app/node_modules/.pnpm
+COPY --from=builder /deps/node_modules/pg /app/node_modules/pg
+COPY --from=builder /deps/node_modules/drizzle-orm /app/node_modules/drizzle-orm
+
 # Copy server launcher
 COPY --from=builder /app/scripts/serverLauncher/startServer.js /app/startServer.js

@@ -240,6 +240,8 @@ ENV \
    OPENROUTER_API_KEY="" OPENROUTER_MODEL_LIST="" \
    # Perplexity
    PERPLEXITY_API_KEY="" PERPLEXITY_MODEL_LIST="" PERPLEXITY_PROXY_URL="" \
+    # PPIO
+    PPIO_API_KEY="" PPIO_MODEL_LIST="" \
    # Qwen
    QWEN_API_KEY="" QWEN_MODEL_LIST="" QWEN_PROXY_URL="" \
    # SambaNova
@@ -68,8 +68,9 @@ ENV NODE_OPTIONS="--max-old-space-size=8192"

 WORKDIR /app

-COPY package.json ./
+COPY package.json pnpm-workspace.yaml ./
 COPY .npmrc ./
+COPY packages ./packages

 RUN \
    # If you want to build docker in China, build with --build-arg USE_CN_MIRROR=true
@@ -87,10 +88,7 @@ RUN \
    # Use pnpm for corepack
    && corepack use $(sed -n 's/.*"packageManager": "\(.*\)".*/\1/p' package.json) \
    # Install the dependencies
-    && pnpm i \
-    # Add sharp dependencies
-    && mkdir -p /deps \
-    && pnpm add sharp --prefix /deps
+    && pnpm i

 COPY . .

@@ -102,13 +100,9 @@ FROM busybox:latest AS app

 COPY --from=base /distroless/ /

-COPY --from=builder /app/public /app/public
-
 # Automatically leverage output traces to reduce image size
 # https://nextjs.org/docs/advanced-features/output-file-tracing
 COPY --from=builder /app/.next/standalone /app/
-COPY --from=builder /app/.next/static /app/.next/static
-COPY --from=builder /deps/node_modules/.pnpm /app/node_modules/.pnpm

 # Copy server launcher
 COPY --from=builder /app/scripts/serverLauncher/startServer.js /app/startServer.js
@@ -196,9 +196,10 @@ We have implemented support for the following model service providers:
 - **[Cloudflare Workers AI](https://lobechat.com/discover/provider/cloudflare)**: Run serverless GPU-powered machine learning models on Cloudflare's global network.
 - **[GitHub](https://lobechat.com/discover/provider/github)**: With GitHub Models, developers can become AI engineers and leverage the industry's leading AI models.

-<details><summary><kbd>See more providers (+26)</kbd></summary>
+<details><summary><kbd>See more providers (+27)</kbd></summary>

 - **[Novita](https://lobechat.com/discover/provider/novita)**: Novita AI is a platform providing a variety of large language models and AI image generation API services, flexible, reliable, and cost-effective. It supports the latest open-source models like Llama3 and Mistral, offering a comprehensive, user-friendly, and auto-scaling API solution for generative AI application development, suitable for the rapid growth of AI startups.
+- **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO supports stable and cost-efficient open-source LLM APIs, such as DeepSeek, Llama, Qwen etc.
 - **[Together AI](https://lobechat.com/discover/provider/togetherai)**: Together AI is dedicated to achieving leading performance through innovative AI models, offering extensive customization capabilities, including rapid scaling support and intuitive deployment processes to meet various enterprise needs.
 - **[Fireworks AI](https://lobechat.com/discover/provider/fireworksai)**: Fireworks AI is a leading provider of advanced language model services, focusing on functional calling and multimodal processing. Its latest model, Firefunction V2, is based on Llama-3, optimized for function calling, conversation, and instruction following. The visual language model FireLLaVA-13B supports mixed input of images and text. Other notable models include the Llama series and Mixtral series, providing efficient multilingual instruction following and generation support.
 - **[Groq](https://lobechat.com/discover/provider/groq)**: Groq's LPU inference engine has excelled in the latest independent large language model (LLM) benchmarks, redefining the standards for AI solutions with its remarkable speed and efficiency. Groq represents instant inference speed, demonstrating strong performance in cloud-based deployments.
@@ -227,7 +228,7 @@ We have implemented support for the following model service providers:

 </details>

-> 📊 Total providers: [<kbd>**36**</kbd>](https://lobechat.com/discover/providers)
+> 📊 Total providers: [<kbd>**37**</kbd>](https://lobechat.com/discover/providers)

 <!-- PROVIDER LIST -->

@@ -329,7 +330,7 @@ In addition, these plugins are not limited to news aggregation, but can also ext
 | [Bing_websearch](https://lobechat.com/discover/plugin/Bingsearch-identifier)<br/><sup>By **FineHow** on **2024-12-22**</sup> | Search for information from the internet base BingApi<br/>`bingsearch`                                                  |
 | [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2024-12-22**</sup>        | Analyze stocks and get comprehensive real-time investment data and analytics.<br/>`stock`                               |

-> 📊 Total plugins: [<kbd>**48**</kbd>](https://lobechat.com/discover/plugins)
+> 📊 Total plugins: [<kbd>**47**</kbd>](https://lobechat.com/discover/plugins)

 <!-- PLUGIN LIST -->

@@ -560,25 +561,22 @@ If you have deployed your own project following the one-click deployment steps i

 We provide a Docker image for deploying the LobeChat service on your own private device. Use the following command to start the LobeChat service:

+1. create a folder to for storage files
+
 ```fish
-$ docker run -d -p 3210:3210 \
-  -e OPENAI_API_KEY=sk-xxxx \
-  -e ACCESS_CODE=lobe66 \
-  --name lobe-chat \
-  lobehub/lobe-chat
+$ mkdir lobe-chat-db && cd lobe-chat-db
 ```

-> \[!TIP]
->
-> If you need to use the OpenAI service through a proxy, you can configure the proxy address using the `OPENAI_PROXY_URL` environment variable:
+2. init the LobeChat infrastructure

 ```fish
-$ docker run -d -p 3210:3210 \
-  -e OPENAI_API_KEY=sk-xxxx \
-  -e OPENAI_PROXY_URL=https://api-proxy.com/v1 \
-  -e ACCESS_CODE=lobe66 \
-  --name lobe-chat \
-  lobehub/lobe-chat
+bash <(curl -fsSL https://lobe.li/setup.sh)
+```
+
+3. Start the LobeChat service
+
+```fish
+docker compose up -d
 ```

 > \[!NOTE]
@@ -671,7 +669,7 @@ If you would like to learn more details, please feel free to look at our [📘 D

 ## 🤝 Contributing

-Contributions of all types are more than welcome; if you are interested in contributing code, feel free to check out our GitHub [Issues][github-issues-link] and [Projects][github-project-link] to get stuck in to show us what you’re made of.
+Contributions of all types are more than welcome; if you are interested in contributing code, feel free to check out our GitHub [Issues][github-issues-link] and [Projects][github-project-link] to get stuck in to show us what you're made of.

 > \[!TIP]
 >
@@ -793,15 +791,15 @@ This project is [Apache 2.0](./LICENSE) licensed.
 [discord-link]: https://discord.gg/AYFPHvv2jT
 [discord-shield]: https://img.shields.io/discord/1127171173982154893?color=5865F2&label=discord&labelColor=black&logo=discord&logoColor=white&style=flat-square
 [discord-shield-badge]: https://img.shields.io/discord/1127171173982154893?color=5865F2&label=discord&labelColor=black&logo=discord&logoColor=white&style=for-the-badge
-[docker-pulls-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-pulls-shield]: https://img.shields.io/docker/pulls/lobehub/lobe-chat?color=45cc11&labelColor=black&style=flat-square
-[docker-release-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-release-shield]: https://img.shields.io/docker/v/lobehub/lobe-chat?color=369eff&label=docker&labelColor=black&logo=docker&logoColor=white&style=flat-square&sort=semver
-[docker-size-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-size-shield]: https://img.shields.io/docker/image-size/lobehub/lobe-chat?color=369eff&labelColor=black&style=flat-square
+[docker-pulls-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-pulls-shield]: https://img.shields.io/docker/pulls/lobehub/lobe-chat?color=45cc11&labelColor=black&style=flat-square&sort=semver
+[docker-release-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-release-shield]: https://img.shields.io/docker/v/lobehub/lobe-chat-database?color=369eff&label=docker&labelColor=black&logo=docker&logoColor=white&style=flat-square&sort=semver
+[docker-size-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-size-shield]: https://img.shields.io/docker/image-size/lobehub/lobe-chat-database?color=369eff&labelColor=black&style=flat-square&sort=semver
 [docs]: https://lobehub.com/docs/usage/start
 [docs-dev-guide]: https://github.com/lobehub/lobe-chat/wiki/index
-[docs-docker]: https://lobehub.com/docs/self-hosting/platform/docker
+[docs-docker]: https://lobehub.com/docs/self-hosting/server-database/docker-compose
 [docs-env-var]: https://lobehub.com/docs/self-hosting/environment-variables
 [docs-feat-agent]: https://lobehub.com/docs/usage/features/agent-market
 [docs-feat-artifacts]: https://lobehub.com/docs/usage/features/artifacts
@@ -892,7 +890,7 @@ This project is [Apache 2.0](./LICENSE) licensed.
 [profile-link]: https://github.com/lobehub
 [share-linkedin-link]: https://linkedin.com/feed
 [share-linkedin-shield]: https://img.shields.io/badge/-share%20on%20linkedin-black?labelColor=black&logo=linkedin&logoColor=white&style=flat-square
-[share-mastodon-link]: https://mastodon.social/share?text=Check%20this%20GitHub%20repository%20out%20%F0%9F%A4%AF%20LobeChat%20-%20An%20open-source,%20extensible%20(Function%20Calling),%20high-performance%20chatbot%20framework.%20It%20supports%20one-click%20free%20deployment%20of%20your%20private%20ChatGPT/LLM%20web%20application.%20https://github.com/lobehub/lobe-chat%20#chatbot%20#chatGPT%20#openAI
+[share-mastodon-link]: https://mastodon.social/share?text=Check%20this%20GitHub%20repository%20out%20%F0%9F%A4%AF%20LobeChat%20-%20An%20open-source,%20extensible%20%28Function%20Calling%29,%20high-performance%20chatbot%20framework.%20It%20supports%20one-click%20free%20deployment%20of%20your%20private%20ChatGPT%2FLLM%20web%20application.%20https://github.com/lobehub/lobe-chat%20#chatbot%20#chatGPT%20#openAI
 [share-mastodon-shield]: https://img.shields.io/badge/-share%20on%20mastodon-black?labelColor=black&logo=mastodon&logoColor=white&style=flat-square
 [share-reddit-link]: https://www.reddit.com/submit?title=Check%20this%20GitHub%20repository%20out%20%F0%9F%A4%AF%20LobeChat%20-%20An%20open-source%2C%20extensible%20%28Function%20Calling%29%2C%20high-performance%20chatbot%20framework.%20It%20supports%20one-click%20free%20deployment%20of%20your%20private%20ChatGPT%2FLLM%20web%20application.%20%23chatbot%20%23chatGPT%20%23openAI&url=https%3A%2F%2Fgithub.com%2Flobehub%2Flobe-chat
 [share-reddit-shield]: https://img.shields.io/badge/-share%20on%20reddit-black?labelColor=black&logo=reddit&logoColor=white&style=flat-square
@@ -196,9 +196,10 @@ LobeChat 支持文件上传与知识库功能，你可以上传文件、图片
 - **[Cloudflare Workers AI](https://lobechat.com/discover/provider/cloudflare)**: 在 Cloudflare 的全球网络上运行由无服务器 GPU 驱动的机器学习模型。
 - **[GitHub](https://lobechat.com/discover/provider/github)**: 通过 GitHub 模型，开发人员可以成为 AI 工程师，并使用行业领先的 AI 模型进行构建。

-<details><summary><kbd>See more providers (+26)</kbd></summary>
+<details><summary><kbd>See more providers (+27)</kbd></summary>

 - **[Novita](https://lobechat.com/discover/provider/novita)**: Novita AI 是一个提供多种大语言模型与 AI 图像生成的 API 服务的平台，灵活、可靠且具有成本效益。它支持 Llama3、Mistral 等最新的开源模型，并为生成式 AI 应用开发提供了全面、用户友好且自动扩展的 API 解决方案，适合 AI 初创公司的快速发展。
+- **[PPIO](https://lobechat.com/discover/provider/ppio)**: PPIO 派欧云提供稳定、高性价比的开源模型 API 服务，支持 DeepSeek 全系列、Llama、Qwen 等行业领先大模型。
 - **[Together AI](https://lobechat.com/discover/provider/togetherai)**: Together AI 致力于通过创新的 AI 模型实现领先的性能，提供广泛的自定义能力，包括快速扩展支持和直观的部署流程，满足企业的各种需求。
 - **[Fireworks AI](https://lobechat.com/discover/provider/fireworksai)**: Fireworks AI 是一家领先的高级语言模型服务商，专注于功能调用和多模态处理。其最新模型 Firefunction V2 基于 Llama-3，优化用于函数调用、对话及指令跟随。视觉语言模型 FireLLaVA-13B 支持图像和文本混合输入。其他 notable 模型包括 Llama 系列和 Mixtral 系列，提供高效的多语言指令跟随与生成支持。
 - **[Groq](https://lobechat.com/discover/provider/groq)**: Groq 的 LPU 推理引擎在最新的独立大语言模型（LLM）基准测试中表现卓越，以其惊人的速度和效率重新定义了 AI 解决方案的标准。Groq 是一种即时推理速度的代表，在基于云的部署中展现了良好的性能。
@@ -227,7 +228,7 @@ LobeChat 支持文件上传与知识库功能，你可以上传文件、图片

 </details>

-> 📊 Total providers: [<kbd>**36**</kbd>](https://lobechat.com/discover/providers)
+> 📊 Total providers: [<kbd>**37**</kbd>](https://lobechat.com/discover/providers)

 <!-- PROVIDER LIST -->

@@ -322,7 +323,7 @@ LobeChat 的插件生态系统是其核心功能的重要扩展，它极大地
 | [必应网页搜索](https://lobechat.com/discover/plugin/Bingsearch-identifier)<br/><sup>By **FineHow** on **2024-12-22**</sup> | 通过 BingApi 搜索互联网上的信息<br/>`bingsearch`                                   |
 | [PortfolioMeta](https://lobechat.com/discover/plugin/StockData)<br/><sup>By **portfoliometa** on **2024-12-22**</sup>      | 分析股票并获取全面的实时投资数据和分析。<br/>`股票`                                |

-> 📊 Total plugins: [<kbd>**48**</kbd>](https://lobechat.com/discover/plugins)
+> 📊 Total plugins: [<kbd>**47**</kbd>](https://lobechat.com/discover/plugins)

 <!-- PLUGIN LIST -->

@@ -540,27 +541,24 @@ LobeChat 提供了 Vercel 的 自托管版本 和 [Docker 镜像][docker-release
 [![][docker-size-shield]][docker-size-link]
 [![][docker-pulls-shield]][docker-pulls-link]

-我们提供了 Docker 镜像，供你在自己的私有设备上部署 LobeChat 服务。使用以下命令即可使用一键启动 LobeChat 服务：
+We provide a Docker image for deploying the LobeChat service on your own private device. Use the following command to start the LobeChat service:
+
+1. create a folder to for storage files

 ```fish
-$ docker run -d -p 3210:3210 \
-  -e OPENAI_API_KEY=sk-xxxx \
-  -e ACCESS_CODE=lobe66 \
-  --name lobe-chat \
-  lobehub/lobe-chat
+$ mkdir lobe-chat-db && cd lobe-chat-db
 ```

-> \[!TIP]
->
-> 如果你需要通过代理使用 OpenAI 服务，你可以使用 `OPENAI_PROXY_URL` 环境变量来配置代理地址：
+2. 启动一键脚本

 ```fish
-$ docker run -d -p 3210:3210 \
-  -e OPENAI_API_KEY=sk-xxxx \
-  -e OPENAI_PROXY_URL=https://api-proxy.com/v1 \
-  -e ACCESS_CODE=lobe66 \
-  --name lobe-chat \
-  lobehub/lobe-chat
+bash <(curl -fsSL https://lobe.li/setup.sh) -l zh_CN
+```
+
+3. 启动 LobeChat
+
+```fish
+docker compose up -d
 ```

 > \[!NOTE]
@@ -813,15 +811,15 @@ This project is [Apache 2.0](./LICENSE) licensed.
 [discord-link]: https://discord.gg/AYFPHvv2jT
 [discord-shield]: https://img.shields.io/discord/1127171173982154893?color=5865F2&label=discord&labelColor=black&logo=discord&logoColor=white&style=flat-square
 [discord-shield-badge]: https://img.shields.io/discord/1127171173982154893?color=5865F2&label=discord&labelColor=black&logo=discord&logoColor=white&style=for-the-badge
-[docker-pulls-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-pulls-shield]: https://img.shields.io/docker/pulls/lobehub/lobe-chat?color=45cc11&labelColor=black&style=flat-square
-[docker-release-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-release-shield]: https://img.shields.io/docker/v/lobehub/lobe-chat?color=369eff&label=docker&labelColor=black&logo=docker&logoColor=white&style=flat-square
-[docker-size-link]: https://hub.docker.com/r/lobehub/lobe-chat
-[docker-size-shield]: https://img.shields.io/docker/image-size/lobehub/lobe-chat?color=369eff&labelColor=black&style=flat-square
+[docker-pulls-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-pulls-shield]: https://img.shields.io/docker/pulls/lobehub/lobe-chat?color=45cc11&labelColor=black&style=flat-square&sort=semver
+[docker-release-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-release-shield]: https://img.shields.io/docker/v/lobehub/lobe-chat-database?color=369eff&label=docker&labelColor=black&logo=docker&logoColor=white&style=flat-square&sort=semver
+[docker-size-link]: https://hub.docker.com/r/lobehub/lobe-chat-database
+[docker-size-shield]: https://img.shields.io/docker/image-size/lobehub/lobe-chat-database?color=369eff&labelColor=black&style=flat-square&sort=semver
 [docs]: https://lobehub.com/zh/docs/usage/start
 [docs-dev-guide]: https://github.com/lobehub/lobe-chat/wiki/index
-[docs-docker]: https://lobehub.com/docs/self-hosting/platform/docker
+[docs-docker]: https://lobehub.com/zh/docs/self-hosting/server-database/docker-compose
 [docs-env-var]: https://lobehub.com/docs/self-hosting/environment-variables
 [docs-feat-agent]: https://lobehub.com/docs/usage/features/agent-market
 [docs-feat-artifacts]: https://lobehub.com/docs/usage/features/artifacts
@@ -1,4 +1,216 @@
 [
+  {
+    "children": {
+      "fixes": ["Fix mistral can not chat."]
+    },
+    "date": "2025-03-09",
+    "version": "1.69.4"
+  },
+  {
+    "children": {
+      "improvements": ["Add login ui for next-auth."]
+    },
+    "date": "2025-03-08",
+    "version": "1.69.3"
+  },
+  {
+    "children": {
+      "improvements": ["Refactor the agent runtime implement."]
+    },
+    "date": "2025-03-07",
+    "version": "1.69.2"
+  },
+  {
+    "children": {
+      "improvements": ["Add Qwen QwQ model."]
+    },
+    "date": "2025-03-07",
+    "version": "1.69.1"
+  },
+  {
+    "children": {
+      "features": ["Support Anthropic Context Caching."]
+    },
+    "date": "2025-03-07",
+    "version": "1.69.0"
+  },
+  {
+    "children": {
+      "improvements": ["Add Gemini 2.0 Flash model variations, add QwQ models."]
+    },
+    "date": "2025-03-07",
+    "version": "1.68.11"
+  },
+  {
+    "children": {
+      "fixes": ["Fix litellm streaming usage and refactor the usage chunk."]
+    },
+    "date": "2025-03-06",
+    "version": "1.68.10"
+  },
+  {
+    "children": {
+      "improvements": ["Add epub file chunk split support."]
+    },
+    "date": "2025-03-05",
+    "version": "1.68.9"
+  },
+  {
+    "children": {
+      "improvements": ["Improve openrouter models info."]
+    },
+    "date": "2025-03-05",
+    "version": "1.68.8"
+  },
+  {
+    "children": {
+      "improvements": ["Refactor agent runtime to better code format."]
+    },
+    "date": "2025-03-05",
+    "version": "1.68.7"
+  },
+  {
+    "children": {
+      "fixes": ["Fix custom ai provider sdk type."]
+    },
+    "date": "2025-03-05",
+    "version": "1.68.6"
+  },
+  {
+    "children": {
+      "improvements": ["Fix provider order."]
+    },
+    "date": "2025-03-04",
+    "version": "1.68.5"
+  },
+  {
+    "children": {
+      "improvements": ["Support to show token usages."]
+    },
+    "date": "2025-03-04",
+    "version": "1.68.4"
+  },
+  {
+    "children": {
+      "fixes": ["Improve url rules."]
+    },
+    "date": "2025-03-03",
+    "version": "1.68.3"
+  },
+  {
+    "children": {
+      "improvements": ["Add build-in web search support for Wenxin & Hunyuan."]
+    },
+    "date": "2025-03-03",
+    "version": "1.68.2"
+  },
+  {
+    "children": {
+      "fixes": ["Fix page crash with crawler error."]
+    },
+    "date": "2025-03-03",
+    "version": "1.68.1"
+  },
+  {
+    "children": {
+      "features": ["Add new model provider PPIO."],
+      "fixes": ["Fix search web-browsing display bug."]
+    },
+    "date": "2025-03-03",
+    "version": "1.68.0"
+  },
+  {
+    "children": {
+      "fixes": ["Improve some crawl case."]
+    },
+    "date": "2025-03-02",
+    "version": "1.67.2"
+  },
+  {
+    "children": {},
+    "date": "2025-03-02",
+    "version": "1.67.1"
+  },
+  {
+    "children": {
+      "features": ["Support web page crawl in the search."]
+    },
+    "date": "2025-03-02",
+    "version": "1.67.0"
+  },
+  {
+    "children": {
+      "improvements": ["Add gpt-4.5-preview for OpenAI."]
+    },
+    "date": "2025-03-02",
+    "version": "1.66.6"
+  },
+  {
+    "children": {
+      "improvements": ["Improve portal style."]
+    },
+    "date": "2025-02-28",
+    "version": "1.66.5"
+  },
+  {
+    "children": {
+      "improvements": ["Optimize smooth output."]
+    },
+    "date": "2025-02-28",
+    "version": "1.66.4"
+  },
+  {
+    "children": {
+      "fixes": ["Fix fetch assistants plugin error."]
+    },
+    "date": "2025-02-27",
+    "version": "1.66.3"
+  },
+  {
+    "children": {
+      "fixes": ["Update Claude sonnet 3.7 model ID."]
+    },
+    "date": "2025-02-27",
+    "version": "1.66.2"
+  },
+  {
+    "children": {
+      "improvements": ["Added eu-central-1 region for bedrock."]
+    },
+    "date": "2025-02-27",
+    "version": "1.66.1"
+  },
+  {
+    "children": {
+      "features": ["Add online search support for available providers."]
+    },
+    "date": "2025-02-27",
+    "version": "1.66.0"
+  },
+  {
+    "children": {
+      "improvements": [
+        "Support parsing the search flag when parsing the model list, Update Gemini & Qwen models."
+      ]
+    },
+    "date": "2025-02-27",
+    "version": "1.65.2"
+  },
+  {
+    "children": {
+      "fixes": ["Fix claude 3.7 sonnet thinking with tool use."]
+    },
+    "date": "2025-02-26",
+    "version": "1.65.1"
+  },
+  {
+    "children": {
+      "features": ["Support claude sonnet 3.7 thinking."],
+      "improvements": ["Update Gemini 2.0 search settings."]
+    },
+    "date": "2025-02-25",
+    "version": "1.65.0"
+  },
  {
    "children": {
      "improvements": ["Add Claude 3.7 Sonnet and Haiku 3.5."]
@@ -3,6 +3,7 @@ services:
  network-service:
    image: alpine
    container_name: lobe-network
+    restart: always
    ports:
      - '${MINIO_PORT}:${MINIO_PORT}' # MinIO API
      - '9001:9001' # MinIO Console
@@ -76,6 +77,19 @@ services:
    env_file:
      - .env

+  searxng:
+    image: searxng/searxng
+    container_name: lobe-searxng
+    volumes:
+      - './searxng-settings.yml:/etc/searxng/settings.yml'
+    environment:
+      - 'SEARXNG_SETTINGS_FILE=/etc/searxng/settings.yml'
+    restart: always
+    networks:
+      - lobe-network
+    env_file:
+      - .env
+
  lobe:
    image: lobehub/lobe-chat-database
    container_name: lobe-chat
@@ -102,6 +116,7 @@ services:
      - 'S3_SECRET_ACCESS_KEY=${MINIO_ROOT_PASSWORD}'
      - 'LLM_VISION_IMAGE_USE_BASE64=1'
      - 'S3_SET_ACL=0'
+      - 'SEARXNG_URL=http://searxng:8080'
    env_file:
      - .env
    restart: always
@@ -170,6 +170,16 @@ show_message() {
                ;;
            esac
        ;;
+        tips_download_failed)
+            case $LANGUAGE in
+                zh_CN)
+                    echo "$2 下载失败，请检查网络连接。"
+                ;;
+                *)
+                    echo "$2 Download failed, please check the network connection."
+                ;;
+            esac
+        ;;
        tips_already_installed)
            case $LANGUAGE in
                zh_CN)
@@ -260,6 +270,30 @@ show_message() {
                ;;
            esac
        ;;
+        tips_no_docker_permission)
+            case $LANGUAGE in
+                zh_CN)
+                    echo "WARN: 看起来当前用户没有 Docker 权限。"
+                    echo "使用 'sudo usermod -aG docker $USER' 为用户分配 Docker 权限（可能需要重新启动 shell）。"
+                ;;
+                *)
+                    echo "WARN: It look like the current user does not have Docker permissions."
+                    echo "Use 'sudo usermod -aG docker $USER' to assign Docker permissions to the user (may require restarting shell)."
+                ;;
+            esac
+        ;;
+        tips_init_database_failed)
+            case $LANGUAGE in
+                zh_CN)
+                    echo "无法初始化数据库，为了避免你的数据重复初始化，请在首次成功启动时运行以下指令清空 Casdoor 初始配置文件："
+                    echo "echo '{}' > init_data.json"
+                ;;
+                *)
+                    echo "Failed to initialize the database. To avoid your data being initialized repeatedly, run the following command to unmount the initial configuration file of Casdoor when you first start successfully:"
+                    echo "echo '{}' > init_data.json"
+                ;;
+            esac
+        ;;
        ask_regenerate_secrets)
            case $LANGUAGE in
                zh_CN)
@@ -320,12 +354,27 @@ show_message() {
                ;;
            esac
        ;;
+        ask_init_database)
+            case $LANGUAGE in
+                zh_CN)
+                    echo "是否初始化数据库？"
+                ;;
+                *)
+                    echo "Do you want to initialize the database?"
+                ;;
+            esac
+        ;;
    esac
 }

 # Function to download files
 download_file() {
-    wget -q --show-progress "$1" -O "$2"
+    wget --show-progress "$1" -O "$2"
+    # If run failed, exit
+    if [ $? -ne 0 ]; then
+        show_message "tips_download_failed" "$2"
+        exit 1
+    fi
 }

 print_centered() {
@@ -394,6 +443,7 @@ SUB_DIR="docker-compose/local"
 FILES=(
    "$SUB_DIR/docker-compose.yml"
    "$SUB_DIR/init_data.json"
+    "$SUB_DIR/searxng-settings.yml"
 )
 ENV_EXAMPLES=(
    "$SUB_DIR/.env.zh-CN.example"
@@ -434,6 +484,7 @@ section_download_files(){
    
    download_file "$SOURCE_URL/${FILES[0]}" "docker-compose.yml"
    download_file "$SOURCE_URL/${FILES[1]}" "init_data.json"
+    download_file "$SOURCE_URL/${FILES[2]}" "searxng-settings.yml"
    
    # Download .env.example with the specified language
    if [ "$LANGUAGE" = "zh_CN" ]; then
@@ -627,12 +678,54 @@ section_regenerate_secrets() {
        fi
    fi
 }
+
 show_message "ask_regenerate_secrets"
 ask "(y/n)" "y"
 if [[ "$ask_result" == "y" ]]; then
    section_regenerate_secrets
 fi

+section_init_database() {
+    if ! command -v docker &> /dev/null ; then
+        echo "docker" $(show_message "tips_no_executable")
+	    return 1
+    fi
+
+    if ! docker compose &> /dev/null ; then
+	    echo "docker compose" $(show_message "tips_no_executable")
+	    return 1
+    fi
+
+    # Check if user has permissions to run Docker by trying to get the status of Docker (docker status).
+    # If this fails, the user probably does not have permissions for Docker.
+    # ref: https://github.com/paperless-ngx/paperless-ngx/blob/89e5c08a1fe4ca0b7641ae8fbd5554502199ae40/install-paperless-ngx.sh#L64-L72
+    if ! docker stats --no-stream &> /dev/null ; then
+	    echo $(show_message "tips_no_docker_permission")
+	    return 1
+    fi
+
+    docker compose pull
+    docker compose up --detach postgresql casdoor
+    # hopefully enough time for even the slower systems
+	sleep 15
+	docker compose stop
+
+    # Init finished, remove init mount
+    echo '{}' > init_data.json
+}
+
+show_message "ask_init_database"
+ask "(y/n)" "y"
+if [[ "$ask_result" == "y" ]]; then
+    # If return 1 means failed
+    section_init_database
+    if [ $? -ne 0 ]; then
+        echo $(show_message "tips_init_database_failed")
+    fi
+else 
+    show_message "tips_init_database_failed"
+fi
+
 section_display_configurated_report() {
    # Display configuration reports
    echo $(show_message "security_secrect_regenerate_report")
@@ -657,4 +750,4 @@ section_display_configurated_report() {
    printf "\n%s" "$(show_message "tips_show_documentation")"
    printf "%s\n" $(show_message "tips_show_documentation_url")
 }
-section_display_configurated_report
+section_display_configurated_report
@@ -27,11 +27,12 @@ By setting the environment variables `NEXT_PUBLIC_CLERK_PUBLISHABLE_KEY` and `CL

 Before using NextAuth, please set the following variables in LobeChat's environment variables:

-| Environment Variable      | Type     | Description                                                                                                                                                                                  |
-| ------------------------- | -------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `NEXT_AUTH_SECRET`        | Required | The key used to encrypt Auth.js session tokens. You can use the following command: `openssl rand -base64 32`, or visit `https://generate-secret.vercel.app/32` to generate the key.          |
-| `NEXTAUTH_URL`            | Required | This URL specifies the callback address for Auth.js when performing OAuth verification. Set this only if the default generated redirect address is incorrect. `https://example.com/api/auth` |
-| `NEXT_AUTH_SSO_PROVIDERS` | Optional | This environment variable is used to enable multiple identity verification sources simultaneously, separated by commas, for example, `auth0,microsoft-entra-id,authentik`.                   |
+| Environment Variable           | Type     | Description                                                                                                                                                                                                                                |
+| ------------------------------ | -------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `NEXT_PUBLIC_ENABLE_NEXT_AUTH` | Required | This is used to enable the NextAuth service. Set it to `1` to enable it; changing this setting requires recompiling the application. Users deploying with the `lobehub/lobe-chat-database` image have this configuration added by default. |
+| `NEXT_AUTH_SECRET`             | Required | The key used to encrypt Auth.js session tokens. You can use the following command: `openssl rand -base64 32`, or visit `https://generate-secret.vercel.app/32` to generate the key.                                                        |
+| `NEXTAUTH_URL`                 | Required | This URL specifies the callback address for Auth.js when performing OAuth verification. Set this only if the default generated redirect address is incorrect. `https://example.com/api/auth`                                               |
+| `NEXT_AUTH_SSO_PROVIDERS`      | Optional | This environment variable is used to enable multiple identity verification sources simultaneously, separated by commas, for example, `auth0,microsoft-entra-id,authentik`.                                                                 |

 Currently supported identity verification services include:

@@ -24,11 +24,12 @@ LobeChat 与 Clerk 做了深度集成，能够为用户提供一个更加安全

 在使用 NextAuth 之前，请先在 LobeChat 的环境变量中设置以下变量：

-| 环境变量                      | 类型 | 描述                                                                                                           |
-| ------------------------- | -- | ------------------------------------------------------------------------------------------------------------ |
-| `NEXT_AUTH_SECRET`        | 必选 | 用于加密 Auth.js 会话令牌的密钥。您可以使用以下命令： `openssl rand -base64 32`，或者访问 `https://generate-secret.vercel.app/32` 生成秘钥。 |
-| `NEXTAUTH_URL`            | 必选 | 该 URL 用于指定 Auth.js 在执行 OAuth 验证时的回调地址，当默认生成的重定向地址发生不正确时才需要设置。`https://example.com/api/auth`                  |
-| `NEXT_AUTH_SSO_PROVIDERS` | 可选 | 该环境变量用于同时启用多个身份验证源，以逗号 `,` 分割，例如 `auth0,microsoft-entra-id,authentik`。                                       |
+| 环境变量                           | 类型 | 描述                                                                                                           |
+| ------------------------------ | -- | ------------------------------------------------------------------------------------------------------------ |
+| `NEXT_PUBLIC_ENABLE_NEXT_AUTH` | 必选 | 用于启用 NextAuth 服务，设置为 `1` 以启用，更改此项需要重新编译应用。使用 `lobehub/lobe-chat-database` 镜像部署的用户已经默认添加了该项配置。                |
+| `NEXT_AUTH_SECRET`             | 必选 | 用于加密 Auth.js 会话令牌的密钥。您可以使用以下命令： `openssl rand -base64 32`，或者访问 `https://generate-secret.vercel.app/32` 生成秘钥。 |
+| `NEXTAUTH_URL`                 | 必选 | 该 URL 用于指定 Auth.js 在执行 OAuth 验证时的回调地址，当默认生成的重定向地址发生不正确时才需要设置。`https://example.com/api/auth`                  |
+| `NEXT_AUTH_SSO_PROVIDERS`      | 可选 | 该环境变量用于同时启用多个身份验证源，以逗号 `,` 分割，例如 `auth0,microsoft-entra-id,authentik`。                                       |

 目前支持的身份验证服务有：

@@ -27,6 +27,7 @@ Go to [Clerk](https://clerk.com?utm_source=lobehub\&utm_medium=docs) to register
  ```shell
  NEXT_PUBLIC_CLERK_PUBLISHABLE_KEY=pk_live_xxxxxxxxxxx
  CLERK_SECRET_KEY=sk_live_xxxxxxxxxxxxxxxxxxxxxx
+  NEXT_PUBLIC_ENABLE_NEXT_AUTH=0
  ```

  ### Create and Configure Webhook in Clerk
@@ -17,7 +17,7 @@ LobeChat supports customizing the model list during deployment. This configurati
 You can use `+` to add a model, `-` to hide a model, and use `model name=display name<extension configuration>` to customize the display name of a model, separated by English commas. The basic syntax is as follows:

 ```text
-id=displayName<maxToken:vision:reasoning:fc:file>,model2,model3
+id=displayName<maxToken:vision:reasoning:search:fc:file>,model2,model3
 ```

 For example: `+qwen-7b-chat,+glm-6b,-gpt-3.5-turbo,gpt-4-0125-preview=gpt-4-turbo`
@@ -29,7 +29,7 @@ In the above example, it adds `qwen-7b-chat` and `glm-6b` to the model list, rem
 Considering the diversity of model capabilities, we started to add extension configuration in version `0.147.8`, with the following rules:

 ```shell
-id=displayName<maxToken:vision:reasoning:fc:file>
+id=displayName<maxToken:vision:reasoning:search:fc:file>
 ```

 The first value in angle brackets is designated as the `maxToken` for this model. The second value and beyond are the model's extension capabilities, separated by colons `:`, and the order is not important.
@@ -40,6 +40,7 @@ Examples are as follows:
 - `spark-v3.5=讯飞星火 v3.5<8192:fc>`: Xunfei Spark 3.5 model, maximum context of 8k, supports Function Call;
 - `gemini-1.5-flash-latest=Gemini 1.5 Flash<16000:vision>`: Google Vision model, maximum context of 16k, supports image recognition;
 - `o3-mini=OpenAI o3-mini<200000:reasoning:fc>`: OpenAI o3-mini model, maximum context of 200k, supports reasoning and Function Call;
+- `qwen-max-latest=Qwen Max<32768:search:fc>`: Qwen 2.5 Max model, maximum context of 32k, supports web search and Function Call;
 - `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`, hacked version of ChatGPT Plus web, context of 128k, supports image recognition, Function Call, file upload.

 Currently supported extension capabilities are:
@@ -49,4 +50,5 @@ Currently supported extension capabilities are:
 | `fc`        | Function Calling                                         |
 | `vision`    | Image Recognition                                        |
 | `reasoning` | Support Reasoning                                        |
+| `search`    | Support Web Search                                        |
 | `file`      | File Upload (a bit hacky, not recommended for daily use) |
@@ -16,7 +16,7 @@ LobeChat 支持在部署时自定义模型列表，详情请参考 [模型提供
 你可以使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。通过 `<>` 来添加扩展配置。基本语法如下：

 ```text
-id=displayName<maxToken:vision:reasoning:fc:file>,model2,model3
+id=displayName<maxToken:vision:reasoning:search:fc:file>,model2,model3
 ```

 例如： `+qwen-7b-chat,+glm-6b,-gpt-3.5-turbo,gpt-4-0125-preview=gpt-4-turbo`
@@ -28,7 +28,7 @@ id=displayName<maxToken:vision:reasoning:fc:file>,model2,model3
 考虑到模型的能力多样性，我们在 `0.147.8` 版本开始增加扩展性配置，它的规则如下：

 ```shell
-id=displayName<maxToken:vision:reasoning:fc:file>
+id=displayName<maxToken:vision:reasoning:search:fc:file>
 ```

 尖括号第一个值约定为这个模型的 `maxToken` 。第二个及以后作为模型的扩展能力，能力与能力之间用冒号 `:` 作为分隔符，顺序不重要。
@@ -39,6 +39,7 @@ id=displayName<maxToken:vision:reasoning:fc:file>
 - `spark-v3.5=讯飞星火 v3.5<8192:fc>`：讯飞星火 3.5 模型，最大上下文 8k，支持 Function Call；
 - `gemini-1.5-flash-latest=Gemini 1.5 Flash<16000:vision>`：Google 视觉模型，最大上下文 16k，支持图像识别；
 - `o3-mini=OpenAI o3-mini<200000:reasoning:fc>`：OpenAI o3-mini 模型，最大上下文 200k，支持推理及 Function Call；
+- `qwen-max-latest=Qwen Max<32768:search:fc>`：通义千问 2.5 Max 模型，最大上下文 32k，支持联网搜索及 Function Call；
 - `gpt-4-all=ChatGPT Plus<128000:fc:vision:file>`，hack 的 ChatGPT Plus 网页版，上下 128k ，支持图像识别、Function Call、文件上传

 目前支持的扩展能力有：
@@ -48,4 +49,5 @@ id=displayName<maxToken:vision:reasoning:fc:file>
 | `fc`        | 函数调用（function calling） |
 | `vision`    | 视觉识别                   |
 | `reasoning` | 支持推理                   |
+| `search`    | 支持联网搜索                   |
 | `file`      | 文件上传（比较 hack，不建议日常使用）  |
@@ -217,6 +217,22 @@ If you need to use Azure OpenAI to provide model services, you can refer to the
 - Default: `-`
 - Example: `-all,+01-ai/yi-34b-chat,+huggingfaceh4/zephyr-7b-beta`

+## PPIO
+
+### `PPIO_API_KEY`
+
+- Type: Required
+- Description: This your PPIO API Key.
+- Default: -
+- Example: `sk_xxxxxxxxxx`
+
+### `PPIO_MODEL_LIST`
+
+- Type: Optional
+- Description: Used to control the model list, use `+` to add a model, use `-` to hide a model, use `model_name=display_name` to customize the display name of a model, separated by commas. Definition syntax rules see [model-list][model-list]
+- Default: `-`
+- Example: `-all,+deepseek/deepseek-v3/community,+deepseek/deepseek-r1-distill-llama-70b`
+
 ## Github

 ### `GITHUB_TOKEN`
@@ -215,6 +215,22 @@ LobeChat 在部署时提供了丰富的模型服务商相关的环境变量，
 - 默认值：`-`
 - 示例：`-all,+01-ai/yi-34b-chat,+huggingfaceh4/zephyr-7b-beta`

+## PPIO
+
+### `PPIO_API_KEY`
+
+- 类型：必选
+- 描述：这是你在 PPIO 网站申请的 API 密钥
+- 默认值：-
+- 示例：`sk_xxxxxxxxxxxx`
+
+### `PPIO_MODEL_LIST`
+
+- 类型：可选
+- 描述：用来控制模型列表，使用 `+` 增加一个模型，使用 `-` 来隐藏一个模型，使用 `模型名=展示名<扩展配置>` 来自定义模型的展示名，用英文逗号隔开。模型定义语法规则见 [模型列表][model-list]
+- 默认值：`-`
+- 示例：`-all,+deepseek/deepseek-v3/community,+deepseek/deepseek-r1-distill-llama-70b`
+
 ## Github

 ### `GITHUB_TOKEN`
@@ -0,0 +1,69 @@
+---
+title: Using Azure AI API Key in LobeChat
+description: Learn how to configure and use Azure AI models in LobeChat, get the API key, and start a conversation.
+tags:
+  - LobeChat
+  - Azure AI
+  - API Key
+  - Web UI
+---
+
+# Using Azure AI in LobeChat
+
+<Image alt={'Using Azure AI in LobeChat'} cover src={'https://github.com/user-attachments/assets/81d0349a-44fe-4dfc-bbc4-8e9a1e09567d'} />
+
+[Azure AI](https://azure.microsoft.com) is an open artificial intelligence technology platform based on the Microsoft Azure cloud platform. It provides various AI functionalities, including natural language processing, machine learning, and computer vision, helping businesses easily develop and deploy AI applications.
+
+This document will guide you on how to integrate Azure AI models into LobeChat:
+
+<Steps>
+  ### Step 1: Deploy Azure AI Project and Model
+
+  - First, visit [Azure AI Foundry](https://ai.azure.com/) and complete the registration and login process.
+  - After logging in, select `Browse models` on the homepage.
+
+  <Image alt={'Accessing Azure AI Foundry'} inStep src={'https://github.com/user-attachments/assets/1c6a3e42-8e24-4148-b2c3-0bfe60a8cf77'} />
+
+  - Choose the model you want in the model marketplace.
+  - Enter the model details and click the `Deploy` button.
+
+  <Image alt={'Browsing Models'} inStep src={'https://github.com/user-attachments/assets/3ed3226c-3d4c-49ef-b2c0-8953dac8a92e'} />
+
+  - In the pop-up dialog, create a new project.
+
+  <Image alt={'Creating a New Project'} inStep src={'https://github.com/user-attachments/assets/199b862a-5de4-4a54-83b2-f4dbf69be902'} />
+
+  <Callout type={'note'}>
+    For detailed configuration of Azure AI Foundry, please refer to the [official documentation](https://learn.microsoft.com/azure/ai-foundry/model-inference/).
+  </Callout>
+
+  ### Step 2: Obtain the Model's API Key and Endpoint
+
+  - In the details of the deployed model, you can find the Endpoint and API Key information.
+  - Copy and save the obtained information.
+
+  <Image alt={'Obtaining API Key'} inStep src={'https://github.com/user-attachments/assets/30c33426-412d-4dec-b096-317fe5880e79'} />
+
+  ### Step 3: Configure Azure AI in LobeChat
+
+  - Visit the `App Settings` and `AI Service Provider` interface in LobeChat.
+  - Find the settings for `Azure AI` in the list of providers.
+
+  <Image alt={'Entering Azure AI API Key'} inStep src={'https://github.com/user-attachments/assets/eb41f77f-ccdd-4a48-a8a2-7badac868c03'} />
+
+  - Enable the Azure AI service provider and fill in the obtained Endpoint and API Key.
+
+  <Callout type={'warning'}>
+    For the Endpoint, you only need to fill in the first part: `https://xxxxxx.services.ai.azure.com/models`.
+  </Callout>
+
+  - Choose an Azure AI model for your assistant and start the conversation.
+
+  <Image alt={'Selecting Azure AI Model'} inStep src={'https://github.com/user-attachments/assets/a1ba8ec0-e259-4da4-8980-0cf82ca5f52b'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider for usage. Please refer to Azure AI's relevant pricing policies.
+  </Callout>
+</Steps>
+
+Now you can use the models provided by Azure AI in LobeChat for conversations.
@@ -0,0 +1,69 @@
+---
+title: 在 LobeChat 中使用 Azure AI API Key
+description: 学习如何在 LobeChat 中配置和使用 Azure AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - Azure AI
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 Azure AI
+
+<Image alt={'在 LobeChat 中使用 Azure AI '} cover src={'https://github.com/user-attachments/assets/81d0349a-44fe-4dfc-bbc4-8e9a1e09567d'} />
+
+[Azure AI](https://azure.microsoft.com) 是一个基于 Microsoft Azure 云平台的开放式人工智能技术平台，提供包括自然语言处理、机器学习、计算机视觉等多种 AI 功能，帮助企业轻松开发和部署 AI 应用。
+
+本文档将指导你如何在 LobeChat 中接入 Azure AI 的模型:
+
+<Steps>
+  ### 步骤一：部署 Azure AI 项目以及模型
+
+  - 首先，访问[Azure AI Foundry](https://ai.azure.com/)并完成注册登录
+  - 登录后在首页选择`浏览模型`
+
+  <Image alt={'进入 Azure AI Foundry'} inStep src={'https://github.com/user-attachments/assets/1c6a3e42-8e24-4148-b2c3-0bfe60a8cf77'} />
+
+  - 在模型广场中选择你想要模型
+  - 进入模型详情，点击`部署`按钮
+
+  <Image alt={'浏览模型'} inStep src={'https://github.com/user-attachments/assets/3ed3226c-3d4c-49ef-b2c0-8953dac8a92e'} />
+
+  - 在弹出的对话框中创建一个新的项目
+
+  <Image alt={'创建新项目'} inStep src={'https://github.com/user-attachments/assets/199b862a-5de4-4a54-83b2-f4dbf69be902'} />
+
+  <Callout type={'note'}>
+    Azure AI Foundry 的详细配置请参考[官方文档](https://learn.microsoft.com/azure/ai-foundry/model-inference/)
+  </Callout>
+
+  ### 步骤二：获取模型的 API Key 及 Endpoint
+
+  - 在已部署的模型详情里，可以查询到 Endpoint 以及 API Key 信息
+  - 复制并保存好获取的信息
+
+  <Image alt={'获取 API Key'} inStep src={'https://github.com/user-attachments/assets/30c33426-412d-4dec-b096-317fe5880e79'} />
+
+  ### 步骤三：在 LobeChat 中配置 Azure AI
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 `Azure AI` 的设置项
+
+  <Image alt={'填写 Azure AI  API 密钥'} inStep src={'https://github.com/user-attachments/assets/eb41f77f-ccdd-4a48-a8a2-7badac868c03'} />
+
+  - 打开 Azure AI 服务商并填入获取的 Endpoint 以及 API 密钥
+
+  <Callout type={'warning'}>
+    Endpoint 只需要填入前面部分 `https://xxxxxx.services.ai.azure.com/models` 即可
+  </Callout>
+
+  - 为你的助手选择一个 Azure AI 模型即可开始对话
+
+  <Image alt={'选择 Azure AI 模型'} inStep src={'https://github.com/user-attachments/assets/a1ba8ec0-e259-4da4-8980-0cf82ca5f52b'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考 Azure AI 的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 Azure AI 提供的模型进行对话了。
@@ -15,7 +15,7 @@ tags:

 <Image alt={'Using DeepSeek in LobeChat'} cover src={'https://github.com/lobehub/lobe-chat/assets/34400653/b4d12904-9d5d-46de-bd66-901eeb9c8e52'} />

-[DeepSeek](https://www.deepseek.com/) is an advanced open-source Large Language Model (LLM). The latest version, DeepSeek-V2, has made significant optimizations in architecture and performance, reducing training costs by 42.5% and inference costs by 93.3%.
+[DeepSeek](https://www.deepseek.com/) represents a cutting-edge open-source large language model. The latest versions, DeepSeek-V3 and DeepSeek-R1, have undergone substantial improvements in both architecture and performance, particularly shining in their inference capabilities. By leveraging innovative training methodologies and reinforcement learning, the model has effectively boosted its inference prowess, now nearly matching the pinnacle performance of OpenAI.

 This document will guide you on how to use DeepSeek in LobeChat:

@@ -48,12 +48,12 @@ This document will guide you on how to use DeepSeek in LobeChat:
  - Access the `App Settings` interface in LobeChat.
  - Find the setting for `DeepSeek` under `Language Models`.

-  <Image alt={'Enter Deepseek API Key'} inStep src={'https://github.com/lobehub/lobe-chat/assets/34400653/bae262d6-0d49-47f3-bc9c-356cf6f3f34e'} />
+  <Image alt={'Enter Deepseek API Key'} inStep src={'https://github.com/user-attachments/assets/aaa3e2c5-7f16-4cfb-86b6-2814a1aafe3a'} />

  - Open DeepSeek and enter the obtained API key.
  - Choose a DeepSeek model for your assistant to start the conversation.

-  <Image alt={'Select Deepseek Model'} inStep src={'https://github.com/lobehub/lobe-chat/assets/34400653/84568505-6efe-4518-8888-682ccdd92197'} />
+  <Image alt={'Select Deepseek Model'} inStep src={'https://github.com/user-attachments/assets/84a5c971-1262-4639-b79f-c8b138530803'} />

  <Callout type={'warning'}>
    You may need to pay the API service provider during usage, please refer to DeepSeek's relevant
@@ -4,6 +4,7 @@ description: 学习如何在 LobeChat 中配置和使用 DeepSeek 语言模型
 tags:
  - LobeChat
  - DeepSeek
+  - DeepSeek R1
  - API密钥
  - Web UI
 ---
@@ -12,9 +13,9 @@ tags:

 <Image alt={'在 LobeChat 中使用 DeepSeek'} cover src={'https://github.com/lobehub/lobe-chat/assets/34400653/b4d12904-9d5d-46de-bd66-901eeb9c8e52'} />

-[DeepSeek](https://www.deepseek.com/) 是一款先进的开源大型语言模型（LLM）。最新版本 DeepSeek-V2 在架构和性能上进行了显著优化，同时训练成本降低了 42.5%, 推理成本降低了 93.3%。
+[DeepSeek](https://www.deepseek.com/) 是一款先进的开源大型语言模型（LLM）。最新的 DeepSeek-V3 和 DeepSeek-R1 在架构和性能上进行了显著优化，特别是在推理能力方面表现出色。它通过创新性的训练方法和强化学习技术，成功地提升了模型的推理能力，并且其性能已逼近 OpenAI 的顶尖水平。

-本文档将指导你如何在 LobeChat 中使用 DeepSeek:
+本文档将指导你如何在 LobeChat 中使用 DeepSeek：

 <Steps>
  ### 步骤一：获取 DeepSeek API 密钥
@@ -44,12 +45,12 @@ tags:
  - 访问 LobeChat 的 `应用设置`界面
  - 在 `语言模型` 下找到 `DeepSeek` 的设置项

-  <Image alt={'填写 Deepseek API 密钥'} inStep src={'https://github.com/lobehub/lobe-chat/assets/34400653/bae262d6-0d49-47f3-bc9c-356cf6f3f34e'} />
+  <Image alt={'填写 Deepseek API 密钥'} inStep src={'https://github.com/user-attachments/assets/aaa3e2c5-7f16-4cfb-86b6-2814a1aafe3a'} />

  - 打开 DeepSeek 并填入获取的 API 密钥
  - 为你的助手选择一个 DeepSeek 模型即可开始对话

-  <Image alt={'选择 Deepseek 模型'} inStep src={'https://github.com/lobehub/lobe-chat/assets/34400653/84568505-6efe-4518-8888-682ccdd92197'} />
+  <Image alt={'选择 Deepseek 模型'} inStep src={'https://github.com/user-attachments/assets/84a5c971-1262-4639-b79f-c8b138530803'} />

  <Callout type={'warning'}>
    在使用过程中你可能需要向 API 服务提供商付费，请参考 DeepSeek 的相关费用政策。
@@ -0,0 +1,51 @@
+---
+title: Using Jina AI API Key in LobeChat
+description: Learn how to configure and use Jina AI models in LobeChat, obtain an API key, and start conversations.
+tags:
+  - LobeChat
+  - Jina AI
+  - API Key
+  - Web UI
+---
+
+# Using Jina AI in LobeChat
+
+<Image alt={'Using Jina AI in LobeChat'} cover src={'https://github.com/user-attachments/assets/840442b1-bf56-4a5f-9700-b3608b16a8a5'} />
+
+[Jina AI](https://jina.ai/) is an open-source neural search company founded in 2020. It focuses on using deep learning technology to process multimodal data, providing efficient information retrieval solutions and supporting search for various data types such as text, images, and videos.
+
+This document will guide you on how to use Jina AI in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain a Jina AI API Key
+
+  - Visit the [Jina AI official website](https://jina.ai/) and click the `API` button on the homepage.
+
+  <Image alt={'Obtain a Jina AI API Key'} inStep src={'https://github.com/user-attachments/assets/5ea37821-4ea8-437c-a15e-3b182d10f19e'} />
+
+  - Find the API Key generated for you in the `API Key` menu below.
+  - Copy and save the generated API Key.
+
+  <Callout type={'info'}>
+    * Jina AI provides each user with 1M free API Tokens, and the API can be used without registration.
+    * If you need to manage the API Key or recharge the API, you need to register and log in to the [Jina AI Console](https://jina.ai/api-dashboard/).
+  </Callout>
+
+  ### Step 2: Configure Jina AI in LobeChat
+
+  - Visit LobeChat's `Application Settings` interface.
+  - Find the `Jina AI` setting under `Language Model`.
+
+  <Image alt={'Fill in Jina AI API Key'} inStep src={'https://github.com/user-attachments/assets/1077bee5-b379-4063-b7bd-23b98ec146e2'} />
+
+  - Enable Jina AI and fill in the obtained API Key.
+  - Select a Jina AI model for your assistant and start the conversation.
+
+  <Image alt={'Select Jina AI Model'} inStep src={'https://github.com/user-attachments/assets/be06e348-8d4c-440c-b59f-b71120f21335'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider during use. Please refer to Jina AI's relevant fee policy.
+  </Callout>
+</Steps>
+
+Now you can use the models provided by Jina AI in LobeChat to have conversations.
@@ -0,0 +1,51 @@
+---
+title: 在 LobeChat 中使用 Jina AI API Key
+description: 学习如何在 LobeChat 中配置和使用 Jina AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - Jina AI
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 Jina AI
+
+<Image alt={'在 LobeChat 中使用 Jina AI'} cover src={'https://github.com/user-attachments/assets/840442b1-bf56-4a5f-9700-b3608b16a8a5'} />
+
+[Jina AI](https://jina.ai/) 是一家成立于 2020 年的开源神经搜索公司，专注于利用深度学习技术处理多模态数据，提供高效的信息检索解决方案，支持文本、图像、视频等多种数据类型的搜索。
+
+本文档将指导你如何在 LobeChat 中使用 Jina AI:
+
+<Steps>
+  ### 步骤一：获取 Jina AI API 密钥
+
+  - 访问 [Jina AI 官方网站](https://jina.ai/)，点击首页的 `API` 按钮
+
+  <Image alt={'获取 Jina AI API 密钥'} inStep src={'https://github.com/user-attachments/assets/5ea37821-4ea8-437c-a15e-3b182d10f19e'} />
+
+  - 在下方的 `API Key` 菜单中找到系统为你生成的 API Key
+  - 复制并保存生成的 API Key
+
+  <Callout type={'info'}>
+    * Jina AI 会为每个用户提供 1M 免费的 API Token，无需注册即可使用 API
+    * 如果需要管理 API Key，或为 API 充值，你需要注册并登录 [Jina AI 控制台](https://jina.ai/api-dashboard/)
+  </Callout>
+
+  ### 步骤二：在 LobeChat 中配置 Jina AI
+
+  - 访问 LobeChat 的 `应用设置`界面
+  - 在 `语言模型` 下找到 `Jina AI` 的设置项
+
+  <Image alt={'填写 Jina AI API 密钥'} inStep src={'https://github.com/user-attachments/assets/1077bee5-b379-4063-b7bd-23b98ec146e2'} />
+
+  - 打开 Jina AI 并填入获取的 API 密钥
+  - 为你的助手选择一个 Jina AI 模型即可开始对话
+
+  <Image alt={'选择 Jina AI 模型'} inStep src={'https://github.com/user-attachments/assets/be06e348-8d4c-440c-b59f-b71120f21335'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考 Jina AI 的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 Jina AI 提供的模型进行对话了。
@@ -0,0 +1,75 @@
+---
+title: Using LM Studio in LobeChat
+description: Learn how to configure and use LM Studio, and run AI models for conversations in LobeChat through LM Studio.
+tags:
+  - LobeChat
+  - LM Studio
+  - Open Source Model
+  - Web UI
+---
+
+# Using LM Studio in LobeChat
+
+<Image alt={'Using LM Studio in LobeChat'} cover src={'https://github.com/user-attachments/assets/cc1f6146-8063-4a4d-947a-7fd6b9133c0c'} />
+
+[LM Studio](https://lmstudio.ai/) is a platform for testing and running large language models (LLMs), providing an intuitive and easy-to-use interface suitable for developers and AI enthusiasts. It supports deploying and running various open-source LLM models, such as Deepseek or Qwen, on local computers, enabling offline AI chatbot functionality, thereby protecting user privacy and providing greater flexibility.
+
+This document will guide you on how to use LM Studio in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain and Install LM Studio
+
+  - Go to the [LM Studio official website](https://lmstudio.ai/)
+  - Choose your platform and download the installation package. LM Studio currently supports MacOS, Windows, and Linux platforms.
+  - Follow the prompts to complete the installation and run LM Studio.
+
+  <Image alt={'Install and run LM Studio'} inStep src={'https://github.com/user-attachments/assets/e887fa04-c553-45f1-917f-5c123ac9c68b'} />
+
+  ### Step 2: Search and Download Models
+
+  - Open the `Discover` menu on the left, search for and download the model you want to use.
+  - Find a suitable model (such as Deepseek R1) and click download.
+  - The download may take some time, please wait patiently for it to complete.
+
+  <Image alt={'Search and download models'} inStep src={'https://github.com/user-attachments/assets/f878355f-710b-452e-8606-0c75c47f29d2'} />
+
+  ### Step 3: Deploy and Run Models
+
+  - Select the downloaded model in the top model selection bar and load the model.
+  - Configure the model runtime parameters in the pop-up panel. Refer to the [LM Studio official documentation](https://lmstudio.ai/docs) for detailed parameter settings.
+
+  <Image alt={'Configure model runtime parameters'} inStep src={'https://github.com/user-attachments/assets/dba58ea6-7df8-4971-b6d4-b24d5f486ba7'} />
+
+  - Click the `Load Model` button and wait for the model to finish loading and running.
+  - Once the model is loaded, you can use it in the chat interface for conversations.
+
+  ### Step 4: Enable Local Service
+
+  - If you want to use the model through other programs, you need to start a local API service. Start the service through the `Developer` panel or the software menu. The LM Studio service starts on port `1234` on your local machine by default.
+
+  <Image alt={'Start local service'} inStep src={'https://github.com/user-attachments/assets/08ced88b-4968-46e8-b1da-0c04ddf5b743'} />
+
+  - After the local service is started, you also need to enable the `CORS (Cross-Origin Resource Sharing)` option in the service settings so that the model can be used in other programs.
+
+  <Image alt={'Enable CORS'} inStep src={'https://github.com/user-attachments/assets/8ce79bd6-f1a3-48bb-b3d0-5271c84801c2'} />
+
+  ### Step 5: Use LM Studio in LobeChat
+
+  - Visit the `AI Service Provider` interface in LobeChat's `Application Settings`.
+  - Find the settings for `LM Studio` in the list of providers.
+
+  <Image alt={'Fill in the LM Studio address'} inStep src={'https://github.com/user-attachments/assets/143ff392-97b5-427a-97a7-f2f577915728'} />
+
+  - Open the LM Studio service provider and fill in the API service address.
+
+  <Callout type={"warning"}>
+    If your LM Studio is running locally, make sure to turn on `Client Request Mode`.
+  </Callout>
+
+  - Add the model you are running in the model list below.
+  - Select a Volcano Engine model for your assistant to start the conversation.
+
+  <Image alt={'Select LM Studio model'} inStep src={'https://github.com/user-attachments/assets/bd399cef-283c-4706-bdc8-de9de662de41'} />
+</Steps>
+
+Now you can use the model running in LM Studio in LobeChat for conversations.
@@ -0,0 +1,75 @@
+---
+title: 在 LobeChat 中使用 LM Studio
+description: 学习如何配置和使用 LM Studio，并在 LobeChat 中 通过 LM Studio 运行 AI 模型进行对话。
+tags:
+  - LobeChat
+  - LM Studio
+  - 开源模型
+  - Web UI
+---
+
+# 在 LobeChat 中使用 LM Studio
+
+<Image alt={'在 LobeChat 中使用 LM Studio'} cover src={'https://github.com/user-attachments/assets/cc1f6146-8063-4a4d-947a-7fd6b9133c0c'} />
+
+[LM Studio](https://lmstudio.ai/) 是一个用于测试和运行大型语言模型（LLM）的平台，提供了直观易用的界面，适合开发人员和 AI 爱好者使用。它支持在本地电脑上部署和运行各种开源 LLM 模型，例如 Deepseek 或 Qwen，实现离线 AI 聊天机器人的功能，从而保护用户隐私并提供更大的灵活性。
+
+本文档将指导你如何在 LobeChat 中使用 LM Studio:
+
+<Steps>
+  ### 步骤一：获取并安装 LM Studio
+
+  - 前往 [LM Studio 官网](https://lmstudio.ai/)
+  - 选择你的平台并下载安装包，LM Studio 目前支持 MacOS、Windows 和 Linux 平台
+  - 按照提示完成安装，运行 LM Studio
+
+  <Image alt={'安装并运行 LM Studio'} inStep src={'https://github.com/user-attachments/assets/e887fa04-c553-45f1-917f-5c123ac9c68b'} />
+
+  ### 步骤二：搜索并下载模型
+
+  - 打开左侧的 `Discover` 菜单，搜索并下载你想要使用的模型
+  - 找到合适的模型（如 Deepseek R1），点击下载
+  - 下载可能需要一些时间，耐心等待完成
+
+  <Image alt={'搜索并下载模型'} inStep src={'https://github.com/user-attachments/assets/f878355f-710b-452e-8606-0c75c47f29d2'} />
+
+  ### 步骤三：部署并运行模型
+
+  - 在顶部的模型选择栏中选择下载好的模型，并加载模型
+  - 在弹出的面板中配置模型运行参数，详细的参数设置请参考 [LM Studio 官方文档](https://lmstudio.ai/docs)
+
+  <Image alt={'配置模型运行参数'} inStep src={'https://github.com/user-attachments/assets/dba58ea6-7df8-4971-b6d4-b24d5f486ba7'} />
+
+  - 点击 `加载模型` 按钮，等待模型完成加载并运行
+  - 模型加载完成后，你可以在聊天界面中使用该模型进行对话
+
+  ### 步骤四：启用本地服务
+
+  - 如果你希望通过其它程序使用该模型，需要启动一个本地 API 服务，通过 `Developer` 面板或软件菜单启动服务，LM Studio 服务默认启动在本机的 `1234` 端口
+
+  <Image alt={'启动本地服务'} inStep src={'https://github.com/user-attachments/assets/08ced88b-4968-46e8-b1da-0c04ddf5b743'} />
+
+  - 本地服务启动后，你还需要在服务设置中开启 `CORS（跨域资源共享）`选项，这样才能在其它程序中使用该模型
+
+  <Image alt={'开启 CORS'} inStep src={'https://github.com/user-attachments/assets/8ce79bd6-f1a3-48bb-b3d0-5271c84801c2'} />
+
+  ### 步骤五：在 LobeChat 中使用 LM Studio
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 `LM Studio` 的设置项
+
+  <Image alt={'填写 LM Studio 的地址'} inStep src={'https://github.com/user-attachments/assets/143ff392-97b5-427a-97a7-f2f577915728'} />
+
+  - 打开 LM Studio 服务商并填入 API 服务地址
+
+  <Callout type={"warning"}>
+    如果你的 LM Studio 运行在本地，请确保打开`客户端请求模式`
+  </Callout>
+
+  - 在下方的模型列表中添加你运行的模型
+  - 为你的助手选择一个火山引擎模型即可开始对话
+
+  <Image alt={'选择 LM Studio 模型'} inStep src={'https://github.com/user-attachments/assets/bd399cef-283c-4706-bdc8-de9de662de41'} />
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 LM Studio 运行的模型进行对话了。
@@ -0,0 +1,55 @@
+---
+title: Using Nvidia NIM API Key in LobeChat
+description: Learn how to configure and use Nvidia NIM AI models in LobeChat, obtain an API key, and start a conversation.
+tags:
+  - LobeChat
+  - Nvidia NIM
+  - API Key
+  - Web UI
+---
+
+# Using Nvidia NIM in LobeChat
+
+<Image alt={'Using Nvidia NIM in LobeChat'} cover src={'https://github.com/user-attachments/assets/539349dd-2c16-4f42-b525-cca74e113541'} />
+
+[NVIDIA NIM](https://developer.nvidia.com/nim) is part of NVIDIA AI Enterprise and is designed to accelerate the deployment of generative AI applications through microservices. It provides a set of easy-to-use inference microservices that can run on any cloud, data center, or workstation, supporting NVIDIA GPU acceleration.
+
+This document will guide you on how to access and use AI models provided by Nvidia NIM in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain Nvidia NIM API Key
+
+  - First, visit the [Nvidia NIM console](https://build.nvidia.com/explore/discover) and complete the registration and login.
+  - On the `Models` page, select the model you need, such as Deepseek-R1.
+
+  <Image alt={'Select Model'} inStep src={'https://github.com/user-attachments/assets/b49ed0c1-d6bf-4f46-b9df-5f7c730afaa3'} />
+
+  - On the model details page, click "Build with this NIM".
+  - In the pop-up dialog, click the `Generate API Key` button.
+
+  <Image alt={'Get API Key'} inStep src={'https://github.com/user-attachments/assets/5321f987-2c64-4211-8549-bd30ca9b59b9'} />
+
+  - Copy and save the created API Key.
+
+  <Callout type={'warning'}>
+    Please store the key securely as it will only appear once. If you accidentally lose it, you will need to create a new key.
+  </Callout>
+
+  ### Step 2: Configure Nvidia NIM in LobeChat
+
+  - Visit the `Application Settings` -> `AI Service Provider` interface in LobeChat.
+  - Find the settings item for `Nvidia NIM` in the list of providers.
+
+  <Image alt={'Fill in the Nvidia NIM API Key'} inStep src={'https://github.com/user-attachments/assets/dfc45807-2ed6-43eb-af4c-47df66dfff7d'} />
+
+  - Enable the Nvidia NIM service provider and fill in the obtained API key.
+  - Select an Nvidia NIM model for your assistant and start the conversation.
+
+  <Image alt={'Select Nvidia NIM Model'} inStep src={'https://github.com/user-attachments/assets/cb4ba5fe-c223-4b9f-a662-de93e4a536d1'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider during use, please refer to Nvidia NIM's related fee policies.
+  </Callout>
+</Steps>
+
+Now you can use the models provided by Nvidia NIM to have conversations in LobeChat.
@@ -0,0 +1,55 @@
+---
+title: 在 LobeChat 中使用 Nvidia NIM API Key
+description: 学习如何在 LobeChat 中配置和使用 Nvidia NIM AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - Nvidia NIM
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 Nvidia NIM
+
+<Image alt={'在 LobeChat 中使用 Nvidia NIM'} cover src={'https://github.com/user-attachments/assets/539349dd-2c16-4f42-b525-cca74e113541'} />
+
+[NVIDIA NIM](https://developer.nvidia.com/nim) 是 NVIDIA AI Enterprise 的一部分，旨在通过微服务加速生成式 AI 应用的部署。它提供了一组易于使用的推理微服务，可以在任何云、数据中心或工作站上运行，支持 NVIDIA GPU 加速。
+
+本文档将指导你如何在 LobeChat 中接入并使用 Nvidia NIM 提供的 AI 模型:
+
+<Steps>
+  ### 步骤一：获取 Nvidia NIM  API 密钥
+
+  - 首先，访问[Nvidia NIM 控制台](https://build.nvidia.com/explore/discover)并完成注册登录
+  - 在 `Models` 页面选择你需要的模型，例如 Deepseek-R1
+
+  <Image alt={'选择模型'} inStep src={'https://github.com/user-attachments/assets/b49ed0c1-d6bf-4f46-b9df-5f7c730afaa3'} />
+
+  - 在模型详情页点击`使用此NIM构建`
+  - 在弹出的对话框中点击`生成 API Key` 按钮
+
+  <Image alt={'获取 API Key'} inStep src={'https://github.com/user-attachments/assets/5321f987-2c64-4211-8549-bd30ca9b59b9'} />
+
+  - 复制并保存创建好的 API Key
+
+  <Callout type={'warning'}>
+    请安全地存储密钥，因为它只会出现一次。如果你意外丢失它，您将需要创建一个新密钥。
+  </Callout>
+
+  ### 步骤二：在 LobeChat 中配置 Nvidia NIM
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 ` Nvidia NIM` 的设置项
+
+  <Image alt={'填写 Nvidia NIM API 密钥'} inStep src={'https://github.com/user-attachments/assets/dfc45807-2ed6-43eb-af4c-47df66dfff7d'} />
+
+  - 打开 Nvidia NIM 服务商并填入获取的 API 密钥
+  - 为你的助手选择一个 Nvidia NIM 模型即可开始对话
+
+  <Image alt={'选择 Nvidia NIM 模型'} inStep src={'https://github.com/user-attachments/assets/cb4ba5fe-c223-4b9f-a662-de93e4a536d1'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考 Nvidia NIM 的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 Nvidia NIM 提供的模型进行对话了。
@@ -0,0 +1,57 @@
+---
+title: Using PPIO API Key in LobeChat
+description: >-
+  Learn how to integrate PPIO's language model APIs into LobeChat. Follow the
+  steps to register, create an PPIO API key, configure settings, and chat with
+  our various AI models.
+tags:
+  - PPIO
+  - DeepSeek
+  - Llama
+  - Qwen
+  - uncensored
+  - API key
+  - Web UI
+---
+
+# Using PPIO in LobeChat
+
+<Image alt={'Using PPIO in LobeChat'} cover src={'https://github.com/user-attachments/assets/d0a5e152-160a-4862-8393-546f4e2e5387'} />
+
+[PPIO](https://ppinfra.com/user/register?invited_by=RQIMOC&utm_source=github_lobechat) supports stable and cost-efficient open-source LLM APIs, such as DeepSeek, Llama, Qwen etc.
+
+This document will guide you on how to integrate PPIO in LobeChat:
+
+<Steps>
+  ### Step 1: Register and Log in to PPIO
+
+  - Visit [PPIO](https://ppinfra.com/user/register?invited_by=RQIMOC&utm_source=github_lobechat) and create an account
+  - Upon registration, PPIO will provide a ￥5 credit (about 5M tokens).
+
+  <Image alt={'Register PPIO'} height={457} inStep src={'https://github.com/user-attachments/assets/7cb3019b-78c1-48e0-a64c-a6a4836affd9'} />
+
+  ### Step 2: Obtain the API Key
+
+  - Visit PPIO's [key management page](https://ppinfra.com/settings/key-management), create and copy an API Key.
+
+  <Image alt={'Obtain PPIO API key'} inStep src={'https://github.com/user-attachments/assets/5abcf21d-5a6c-4fc8-8de6-bc47d4d2fa98'} />
+
+  ### Step 3: Configure PPIO in LobeChat
+
+  - Visit the `Settings` interface in LobeChat
+  - Find the setting for `PPIO` under `Language Model`
+
+  <Image alt={'Enter PPIO API key in LobeChat'} inStep src={'https://github.com/user-attachments/assets/9b70b292-6c52-4715-b844-ff5df78d16b9'} />
+
+  - Open PPIO and enter the obtained API key
+  - Choose a PPIO model for your assistant to start the conversation
+
+  <Image alt={'Select and use PPIO model'} inStep src={'https://github.com/user-attachments/assets/b824b741-f2d8-42c8-8cb9-1266862affa7'} />
+
+  <Callout type={'warning'}>
+    During usage, you may need to pay the API service provider, please refer to PPIO's [pricing
+    policy](https://ppinfra.com/llm-api?utm_source=github_lobe-chat&utm_medium=github_readme&utm_campaign=link).
+  </Callout>
+</Steps>
+
+You can now engage in conversations using the models provided by PPIO in LobeChat.
@@ -0,0 +1,55 @@
+---
+title: 在 LobeChat 中使用 PPIO 派欧云 API Key
+description: >-
+  学习如何将 PPIO 派欧云的 LLM API 集成到 LobeChat 中。跟随以下步骤注册 PPIO 账号、创建 API Key、并在 LobeChat
+  中进行设置。
+tags:
+  - PPIO
+  - PPInfra
+  - DeepSeek
+  - Qwen
+  - Llama3
+  - API key
+  - Web UI
+---
+
+# 在 LobeChat 中使用 PPIO 派欧云
+
+<Image alt={'在 LobeChat 中使用 PPIO'} cover src={'https://github.com/user-attachments/assets/d0a5e152-160a-4862-8393-546f4e2e5387'} />
+
+[PPIO 派欧云](https://ppinfra.com/user/register?invited_by=RQIMOC&utm_source=github_lobechat)提供稳定、高性价比的开源模型 API 服务，支持 DeepSeek 全系列、Llama、Qwen 等行业领先大模型。
+
+本文档将指导你如何在 LobeChat 中使用 PPIO:
+
+<Steps>
+  ### 步骤一：注册 PPIO 派欧云账号并登录
+
+  - 访问 [PPIO 派欧云](https://ppinfra.com/user/register?invited_by=RQIMOC&utm_source=github_lobechat) 并注册账号
+  - 注册后，PPIO 会赠送 5 元（约 500 万 tokens）的使用额度
+
+  <Image alt={'注册 PPIO'} height={457} inStep src={'https://github.com/user-attachments/assets/7cb3019b-78c1-48e0-a64c-a6a4836affd9'} />
+
+  ### 步骤二：创建 API 密钥
+
+  - 访问 PPIO 派欧云的 [密钥管理页面](https://ppinfra.com/settings/key-management) ，创建并且复制一个 API 密钥.
+
+  <Image alt={'创建 PPIO API 密钥'} inStep src={'https://github.com/user-attachments/assets/5abcf21d-5a6c-4fc8-8de6-bc47d4d2fa98'} />
+
+  ### 步骤三：在 LobeChat 中配置 PPIO 派欧云
+
+  - 访问 LobeChat 的 `设置` 界面
+  - 在 `语言模型` 下找到 `PPIO` 的设置项
+  - 打开 PPIO 并填入获得的 API 密钥
+
+  <Image alt={'在 LobeChat 中输入 PPIO API 密钥'} inStep src={'https://github.com/user-attachments/assets/9b70b292-6c52-4715-b844-ff5df78d16b9'} />
+
+  - 为你的助手选择一个 PPIO 模型即可开始对话
+
+  <Image alt={'选择并使用 PPIO 模型'} inStep src={'https://github.com/user-attachments/assets/b824b741-f2d8-42c8-8cb9-1266862affa7'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，PPIO 的 API 费用参考[这里](https://ppinfra.com/llm-api?utm_source=github_lobe-chat&utm_medium=github_readme&utm_campaign=link)。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 PPIO 提供的模型进行对话了。
@@ -0,0 +1,50 @@
+---
+title: Using SambaNova API Key in LobeChat
+description: Learn how to configure and use SambaNova models in LobeChat, obtain an API key, and start a conversation.
+tags:
+  - LobeChat
+  - SambaNova
+  - API Key
+  - Web UI
+---
+
+# Using SambaNova in LobeChat
+
+<Image alt={'Using SambaNova in LobeChat'} cover src={'https://github.com/user-attachments/assets/1028aa1a-6c19-4191-b28a-2020e5637155'} />
+
+[SambaNova](https://sambanova.ai/) is a company based in Palo Alto, California, USA, focused on developing high-performance AI hardware and software solutions. It provides fast AI model training, fine-tuning, and inference capabilities, especially suitable for large-scale generative AI models.
+
+This document will guide you on how to use SambaNova in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain a SambaNova API Key
+
+  - First, you need to register and log in to [SambaNova Cloud](https://cloud.sambanova.ai/)
+  - Create an API key in the `APIs` page
+
+  <Image alt={'Obtain a SambaNova API Key'} inStep src={'https://github.com/user-attachments/assets/ed6965c8-6884-4adf-a457-573a96755f55'} />
+
+  - Copy the obtained API key and save it securely
+
+  <Callout type={'warning'}>
+    Please save the generated API Key securely, as it will only appear once. If you accidentally lose it, you will need to create a new API key.
+  </Callout>
+
+  ### Step 2: Configure SambaNova in LobeChat
+
+  - Access the `Application Settings` interface of LobeChat
+  - Find the `SambaNova` setting item under `Language Model`
+
+  <Image alt={'Fill in the SambaNova API Key'} inStep src={'https://github.com/user-attachments/assets/328e9755-8da9-4849-8569-e099924822fe'} />
+
+  - Turn on SambaNova and fill in the obtained API key
+  - Select a SambaNova model for your assistant to start the conversation
+
+  <Image alt={'Select a SambaNova Model'} inStep src={'https://github.com/user-attachments/assets/6dbf4560-3f62-4b33-9f41-96e12b5087b1'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider during use, please refer to SambaNova's related fee policies.
+  </Callout>
+</Steps>
+
+Now you can use the models provided by SambaNova in LobeChat to conduct conversations.
@@ -0,0 +1,50 @@
+---
+title: 在 LobeChat 中使用 SambaNova API Key
+description: 学习如何在 LobeChat 中配置和使用 SambaNova 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - SambaNova
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 SambaNova
+
+<Image alt={'在 LobeChat 中使用 SambaNova'} cover src={'https://github.com/user-attachments/assets/1028aa1a-6c19-4191-b28a-2020e5637155'} />
+
+[SambaNova](https://sambanova.ai/) 是一家位于美国加利福尼亚州帕洛阿尔托的公司，专注于开发高性能 AI 硬件和软件解决方案，提供快速的 AI 模型训练、微调和推理能力，尤其适用于大规模生成式 AI 模型。
+
+本文档将指导你如何在 LobeChat 中使用 SambaNova:
+
+<Steps>
+  ### 步骤一：获取 SambaNova API 密钥
+
+  - 首先，你需要注册并登录 [SambaNova Cloud](https://cloud.sambanova.ai/)
+  - 在 `APIs` 页面中创建一个 API 密钥
+
+  <Image alt={'获取 SambaNova API 密钥'} inStep src={'https://github.com/user-attachments/assets/ed6965c8-6884-4adf-a457-573a96755f55'} />
+
+  - 复制得到的 API 密钥并妥善保存
+
+  <Callout type={'warning'}>
+    请妥善保存生成的 API Key，它只会出现一次，如果不小心丢失了，你需要重新创建一个 API key
+  </Callout>
+
+  ### 步骤二：在 LobeChat 中配置 SambaNova
+
+  - 访问 LobeChat 的 `应用设置`界面
+  - 在 `语言模型` 下找到 `SambaNova` 的设置项
+
+  <Image alt={'填写 SambaNova API 密钥'} inStep src={'https://github.com/user-attachments/assets/328e9755-8da9-4849-8569-e099924822fe'} />
+
+  - 打开 SambaNova 并填入获取的 API 密钥
+  - 为你的助手选择一个 SambaNova 模型即可开始对话
+
+  <Image alt={'选择 SambaNova 模型'} inStep src={'https://github.com/user-attachments/assets/6dbf4560-3f62-4b33-9f41-96e12b5087b1'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考 SambaNova 的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 SambaNova 提供的模型进行对话了。
@@ -0,0 +1,49 @@
+---
+title: Using Tencent Cloud API Key in LobeChat
+description: Learn how to configure and use Tencent Cloud AI models in LobeChat, obtain an API key, and start a conversation.
+tags:
+  - LobeChat
+  - Tencent Cloud
+  - API Key
+  - Web UI
+---
+
+# Using Tencent Cloud in LobeChat
+
+<Image alt={'Using Tencent Cloud in LobeChat'} cover src={'https://github.com/user-attachments/assets/aa91ca54-65fc-4e33-8c76-999f0a5d2bee'} />
+
+[Tencent Cloud](https://cloud.tencent.com/) is the cloud computing service brand of Tencent, specializing in providing cloud computing services for enterprises and developers. Tencent Cloud provides a series of AI large model solutions, through which AI models can be connected stably and efficiently.
+
+This document will guide you on how to connect Tencent Cloud's AI models in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain the Tencent Cloud API Key
+
+  - First, visit [Tencent Cloud](https://cloud.tencent.com/) and complete the registration and login.
+  - Enter the Tencent Cloud Console and navigate to [Large-scale Knowledge Engine Atomic Capability](https://console.cloud.tencent.com/lkeap).
+  - Activate the Large-scale Knowledge Engine, which requires real-name authentication during the activation process.
+
+  <Image alt={'Enter the Large-scale Knowledge Engine Atomic Capability Page'} inStep src={'https://github.com/user-attachments/assets/22e1a039-5e6e-4c40-8266-19821677618a'} />
+
+  - In the `Access via OpenAI SDK` option, click the `Create API Key` button to create a new API Key.
+  - You can view and manage the created API Keys in `API Key Management`.
+  - Copy and save the created API Key.
+
+  ### Step 2: Configure Tencent Cloud in LobeChat
+
+  - Visit the `Application Settings` and `AI Service Provider` interface of LobeChat.
+  - Find the `Tencent Cloud` settings item in the list of providers.
+
+  <Image alt={'Fill in the Tencent Cloud API Key'} inStep src={'https://github.com/user-attachments/assets/a9de7780-d0cb-47d5-ad9c-fcbbec14b940'} />
+
+  - Open the Tencent Cloud provider and fill in the obtained API Key.
+  - Select a Tencent Cloud model for your assistant to start the conversation.
+
+  <Image alt={'Select Tencent Cloud Model'} inStep src={'https://github.com/user-attachments/assets/162bc64e-0d34-4a4e-815a-028247b73143'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider during use, please refer to Tencent Cloud's relevant fee policy.
+  </Callout>
+</Steps>
+
+You can now use the models provided by Tencent Cloud in LobeChat to have conversations.
@@ -0,0 +1,49 @@
+---
+title: 在 LobeChat 中使用腾讯云 API Key
+description: 学习如何在 LobeChat 中配置和使用腾讯云 AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - 腾讯云
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用腾讯云
+
+<Image alt={'在 LobeChat 中使用腾讯云'} cover src={'https://github.com/user-attachments/assets/aa91ca54-65fc-4e33-8c76-999f0a5d2bee'} />
+
+[腾讯云（Tencent Cloud）](https://cloud.tencent.com/)是腾讯公司旗下的云计算服务品牌，专门为企业和开发者提供云计算服务。腾讯云提供了一系列 AI 大模型解决方案，通过这些工具可以稳定高效接入 AI 模型。
+
+本文档将指导你如何在 LobeChat 中接入腾讯云的 AI 模型:
+
+<Steps>
+  ### 步骤一：获取腾讯云 API 密钥
+
+  - 首先，访问[腾讯云](https://cloud.tencent.com/)并完成注册登录
+  - 进入腾讯云控制台并导航至[知识引擎原子能力](https://console.cloud.tencent.com/lkeap)
+  - 开通大模型知识引擎，开通过程需要实名认证
+
+  <Image alt={'进入知识引擎原子能力页面'} inStep src={'https://github.com/user-attachments/assets/22e1a039-5e6e-4c40-8266-19821677618a'} />
+
+  - 在`使用OpenAI SDK方式接入`选项中，点击 `创建 API Key` 按钮，创建一个新的 API Key
+  - 在 `API key 管理` 中可以查看和管理已创建的 API Key
+  - 复制并保存创建好的 API Key
+
+  ### 步骤二：在 LobeChat 中配置腾讯云
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 `腾讯云` 的设置项
+
+  <Image alt={'填写腾讯云 API 密钥'} inStep src={'https://github.com/user-attachments/assets/a9de7780-d0cb-47d5-ad9c-fcbbec14b940'} />
+
+  - 打开腾讯云服务商并填入获取的 API 密钥
+  - 为你的助手选择一个腾讯云模型即可开始对话
+
+  <Image alt={'选择腾讯云模型'} inStep src={'https://github.com/user-attachments/assets/162bc64e-0d34-4a4e-815a-028247b73143'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考腾讯云的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用腾讯云提供的模型进行对话了。
@@ -0,0 +1,59 @@
+---
+title: Using Vertex AI API Key in LobeChat
+description: Learn how to configure and use Vertex AI models in LobeChat, get an API key, and start a conversation.
+tags:
+  - LobeChat
+  - Vertex AI
+  - API Key
+  - Web UI
+---
+
+# Using Vertex AI in LobeChat
+
+<Image alt={'Using Vertex AI in LobeChat'} cover src={'https://github.com/user-attachments/assets/638dcd7c-2bff-4adb-bade-da2aaef872bf'} />
+
+[Vertex AI](https://cloud.google.com/vertex-ai) is a fully managed, integrated AI development platform from Google Cloud, designed for building and deploying generative AI. It provides easy access to Vertex AI Studio, Agent Builder, and over 160 foundational models for AI development.
+
+This document will guide you on how to connect Vertex AI models in LobeChat:
+
+<Steps>
+  ### Step 1: Prepare a Vertex AI Project
+
+  - First, visit [Google Cloud](https://console.cloud.google.com/) and complete the registration and login process.
+  - Create a new Google Cloud project or select an existing one.
+  - Go to the [Vertex AI Console](https://console.cloud.google.com/vertex-ai).
+  - Ensure that the Vertex AI API service is enabled for the project.
+
+  <Image alt={'Accessing Vertex AI'} inStep src={'https://github.com/user-attachments/assets/c4fe4430-7860-4339-b014-4d8d264a12c0'} />
+
+  ### Step 2: Set Up API Access Permissions
+
+  - Go to the Google Cloud [IAM Management page](https://console.cloud.google.com/iam-admin/serviceaccounts) and navigate to `Service Accounts`.
+  - Create a new service account and assign a role permission to it, such as `Vertex AI User`.
+
+  <Image alt={'Creating a Service Account'} inStep src={'https://github.com/user-attachments/assets/692e7c67-f173-45da-86ef-5c69e17988e4'} />
+
+  - On the service account management page, find the service account you just created, click `Keys`, and create a new JSON format key.
+  - After successful creation, the key file will be automatically saved to your computer in JSON format. Please keep it safe.
+
+  <Image alt={'Creating a Key'} inStep src={'https://github.com/user-attachments/assets/1fb5df18-5261-483e-a445-96f52f80dd20'} />
+
+  ### Step 3: Configure Vertex AI in LobeChat
+
+  - Visit the `App Settings` and then the `AI Service Provider` interface in LobeChat.
+  - Find the settings item for `Vertex AI` in the list of providers.
+
+  <Image alt={'Entering Vertex AI API Key'} inStep src={'https://github.com/user-attachments/assets/5d672e8b-566f-4f82-bdce-947168726bc0'} />
+
+  - Open the Vertex AI service provider settings.
+  - Fill the entire content of the JSON format key you just obtained into the API Key field.
+  - Select a Vertex AI model for your assistant to start the conversation.
+
+  <Image alt={'Selecting a Vertex AI Model'} inStep src={'https://github.com/user-attachments/assets/1a7e9600-cd0f-4c82-9d32-4e61bbb351cc'} />
+
+  <Callout type={'warning'}>
+    You may need to pay the API service provider during usage. Please refer to Google Cloud's relevant fee policies.
+  </Callout>
+</Steps>
+
+Now you can use the models provided by Vertex AI for conversations in LobeChat.
@@ -0,0 +1,59 @@
+---
+title: 在 LobeChat 中使用 Vertex AI API Key
+description: 学习如何在 LobeChat 中配置和使用 Vertex AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - Vertex AI
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 Vertex AI
+
+<Image alt={'在 LobeChat 中使用 Vertex AI '} cover src={'https://github.com/user-attachments/assets/638dcd7c-2bff-4adb-bade-da2aaef872bf'} />
+
+[Vertex AI](https://cloud.google.com/vertex-ai) 是 Google Cloud 的一款全面托管、集成的 AI 开发平台，旨在构建与应用生成式 AI。你可轻松访问 Vertex AI Studio、Agent Builder 以及超过 160 种基础模型，进行 AI 开发。
+
+本文档将指导你如何在 LobeChat 中接入 Vertex AI 的模型:
+
+<Steps>
+  ### 步骤一：准备 Vertex AI 项目
+
+  - 首先，访问[Google Cloud](https://console.cloud.google.com/)并完成注册登录
+  - 创建一个新的 Google Cloud 项目，或选择一个已存在的项目
+  - 进入 [Vertex AI 控制台](https://console.cloud.google.com/vertex-ai)
+  - 确认该项目已开通 Vertex AI API 服务
+
+  <Image alt={'进入 Vertex AI'} inStep src={'https://github.com/user-attachments/assets/c4fe4430-7860-4339-b014-4d8d264a12c0'} />
+
+  ### 步骤二：设置 API 访问权限
+
+  - 进入 Google Cloud [IAM 管理页面](https://console.cloud.google.com/iam-admin/serviceaccounts)，并导航至`服务账号`
+  - 创建一个新的服务账号，并为其分配一个角色权限，例如 `Vertex AI User`
+
+  <Image alt={'创建服务账号'} inStep src={'https://github.com/user-attachments/assets/692e7c67-f173-45da-86ef-5c69e17988e4'} />
+
+  - 在服务账号管理页面找到刚刚创建的服务账号，点击`密钥`并创建一个新的 JSON 格式密钥
+  - 创建成功后，密钥文件将会以 JSON 文件的格式自动保存到你的电脑上，请妥善保存
+
+  <Image alt={'创建密钥'} inStep src={'https://github.com/user-attachments/assets/1fb5df18-5261-483e-a445-96f52f80dd20'} />
+
+  ### 步骤三：在 LobeChat 中配置 Vertex AI
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 `Vertex AI` 的设置项
+
+  <Image alt={'填写 Vertex AI API 密钥'} inStep src={'https://github.com/user-attachments/assets/5d672e8b-566f-4f82-bdce-947168726bc0'} />
+
+  - 打开 Vertex AI 服务供应商
+  - 将刚刚获取的 JSON 格式的全部内容填入 API Key 字段中
+  - 为你的助手选择一个 Vertex AI 模型即可开始对话
+
+  <Image alt={'选择 Vertex AI 模型'} inStep src={'https://github.com/user-attachments/assets/1a7e9600-cd0f-4c82-9d32-4e61bbb351cc'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考 Google Cloud 的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 Vertex AI 提供的模型进行对话了。
@@ -0,0 +1,98 @@
+---
+title: Using vLLM API Key in LobeChat
+description: Learn how to configure and use the vLLM language model in LobeChat, obtain an API key, and start a conversation.
+tags:
+  - LobeChat
+  - vLLM
+  - API Key
+  - Web UI
+---
+
+# Using vLLM in LobeChat
+
+<Image alt={'Using vLLM in LobeChat'} cover src={'https://github.com/user-attachments/assets/1d77cca4-7363-4a46-9ad5-10604e111d7c'} />
+
+[vLLM](https://github.com/vllm-project/vllm) is an open-source local large language model (LLM) deployment tool that allows users to efficiently run LLM models on local devices and provides an OpenAI API-compatible service interface.
+
+This document will guide you on how to use vLLM in LobeChat:
+
+<Steps>
+  ### Step 1: Preparation
+
+  vLLM has certain requirements for hardware and software environments. Be sure to configure according to the following requirements:
+
+  | Hardware Requirements     |                                                                         |
+  | --------- | ----------------------------------------------------------------------- |
+  | GPU       | - NVIDIA CUDA <br /> - AMD ROCm <br /> - Intel XPU                      |
+  | CPU       | - Intel/AMD x86 <br /> - ARM AArch64 <br /> - Apple silicon             |
+  | Other AI Accelerators | - Google TPU <br /> - Intel Gaudi <br /> - AWS Neuron <br /> - OpenVINO |
+
+  | Software Requirements                                    |
+  | --------------------------------------- |
+  | - OS: Linux <br /> - Python: 3.9 – 3.12 |
+
+  ### Step 2: Install vLLM
+
+  If you are using an NVIDIA GPU, you can directly install vLLM using `pip`. However, it is recommended to use `uv` here, which is a very fast Python environment manager, to create and manage the Python environment. Please follow the [documentation](https://docs.astral.sh/uv/#getting-started) to install uv. After installing uv, you can use the following command to create a new Python environment and install vLLM:
+
+  ```shell
+  uv venv myenv --python 3.12 --seed
+  source myenv/bin/activate
+  uv pip install vllm
+  ```
+
+  Another method is to use `uv run` with the `--with [dependency]` option, which allows you to run commands such as `vllm serve` without creating an environment:
+
+  ```shell
+  uv run --with vllm vllm --help
+  ```
+
+  You can also use [conda](https://docs.conda.io/projects/conda/en/latest/user-guide/getting-started.html) to create and manage your Python environment.
+
+  ```shell
+  conda create -n myenv python=3.12 -y
+  conda activate myenv
+  pip install vllm
+  ```
+
+  <Callout type={"note"}>
+    For non-CUDA platforms, please refer to the [official documentation](https://docs.vllm.ai/en/latest/getting_started/installation/index.html#installation-index) to learn how to install vLLM.
+  </Callout>
+
+  ### Step 3: Start Local Service
+
+  vLLM can be deployed as an OpenAI API protocol-compatible server. By default, it will start the server at `http://localhost:8000`. You can specify the address using the `--host` and `--port` parameters. The server currently runs only one model at a time.
+
+  The following command will start a vLLM server and run the `Qwen2.5-1.5B-Instruct` model:
+
+  ```shell
+  vllm serve Qwen/Qwen2.5-1.5B-Instruct
+  ```
+
+  You can enable the server to check the API key in the header by passing the parameter `--api-key` or the environment variable `VLLM_API_KEY`. If not set, no API Key is required to access.
+
+  <Callout type={'note'}>
+    For more detailed vLLM server configuration, please refer to the [official documentation](https://docs.vllm.ai/en/latest/).
+  </Callout>
+
+  ### Step 4: Configure vLLM in LobeChat
+
+  - Access the `Application Settings` interface of LobeChat.
+  - Find the `vLLM` settings item under `Language Model`.
+
+  <Image alt={'Fill in the vLLM API Key'} inStep src={'https://github.com/user-attachments/assets/669c68bf-3f85-4a6f-bb08-d0d7fb7f7417'} />
+
+  - Open the vLLM service provider and fill in the API service address and API Key.
+
+  <Callout type={"warning"}>
+    *   If your vLLM is not configured with an API Key, please leave the API Key blank.
+    *   If your vLLM is running locally, please make sure to turn on `Client Request Mode`.
+  </Callout>
+
+  - Add the model you are running to the model list below.
+  - Select a vLLM model to run for your assistant and start the conversation.
+
+  <Image alt={'Select vLLM Model'} inStep src={'https://github.com/user-attachments/assets/fcdfb9c5-819a-488f-b28d-0857fe861219'} />
+</Steps>
+
+Now you can use the models provided by vLLM in LobeChat to have conversations.
@@ -0,0 +1,98 @@
+---
+title: 在 LobeChat 中使用 vLLM API Key
+description: 学习如何在 LobeChat 中配置和使用 vLLM 语言模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - vLLM
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用 vLLM
+
+<Image alt={'在 LobeChat 中使用 vLLM'} cover src={'https://github.com/user-attachments/assets/1d77cca4-7363-4a46-9ad5-10604e111d7c'} />
+
+[vLLM](https://github.com/vllm-project/vllm)是一个开源的本地大型语言模型（LLM）部署工具，允许用户在本地设备上高效运行 LLM 模型，并提供兼容 OpenAI API 的服务接口。
+
+本文档将指导你如何在 LobeChat 中使用 vLLM:
+
+<Steps>
+  ### 步骤一：准备工作
+
+  vLLM 对于硬件和软件环境均有一定要求，请无比根据以下要求进行配置：
+
+  | 硬件需求      |                                                                         |
+  | --------- | ----------------------------------------------------------------------- |
+  | GPU       | - NVIDIA CUDA <br /> - AMD ROCm <br /> - Intel XPU                      |
+  | CPU       | - Intel/AMD x86 <br /> - ARM AArch64 <br /> - Apple silicon             |
+  | 其他 AI 加速器 | - Google TPU <br /> - Intel Gaudi <br /> - AWS Neuron <br /> - OpenVINO |
+
+  | 软件需求                                    |
+  | --------------------------------------- |
+  | - OS: Linux <br /> - Python: 3.9 – 3.12 |
+
+  ### 步骤二：安装 vLLM
+
+  如果你正在使用 NVIDIA GPU，你可以直接使用`pip`安装 vLLM。但这里建议使用`uv`，它一个非常快速的 Python 环境管理器，来创建和管理 Python 环境。请按照[文档](https://docs.astral.sh/uv/#getting-started)安装 uv。安装 uv 后，你可以使用以下命令创建一个新的 Python 环境并安装 vLLM：
+
+  ```shell
+  uv venv myenv --python 3.12 --seed
+  source myenv/bin/activate
+  uv pip install vllm
+  ```
+
+  另一种方法是使用`uv run`与`--with [dependency]`选项，这允许你运行`vllm serve`等命令而无需创建环境：
+
+  ```shell
+  uv run --with vllm vllm --help
+  ```
+
+  你也可以使用 [conda](https://docs.conda.io/projects/conda/en/latest/user-guide/getting-started.html) 来创建和管理你的 Python 环境。
+
+  ```shell
+  conda create -n myenv python=3.12 -y
+  conda activate myenv
+  pip install vllm
+  ```
+
+  <Callout type={"note"}>
+    对于非 CUDA 平台，请参考[官方文档](https://docs.vllm.ai/en/latest/getting_started/installation/index.html#installation-index)了解如何安装 vLLM
+  </Callout>
+
+  ### 步骤三：启动本地服务
+
+  vLLM 可以部署为一个 OpenAI API 协议兼容的服务器。默认情况下，它将在 `http://localhost:8000` 启动服务器。你可以使用 `--host` 和 `--port` 参数指定地址。服务器目前一次仅运行一个模型。
+
+  以下命令将启动一个 vLLM 服务器并运行 `Qwen2.5-1.5B-Instruct` 模型：
+
+  ```shell
+  vllm serve Qwen/Qwen2.5-1.5B-Instruct
+  ```
+
+  你可以通过传递参数 `--api-key` 或环境变量 `VLLM_API_KEY` 来启用服务器检查头部中的 API 密钥。如不设置，则无需 API Key 即可访问。
+
+  <Callout type={'note'}>
+    更详细的 vLLM 服务器配置，请参考[官方文档](https://docs.vllm.ai/en/latest/)
+  </Callout>
+
+  ### 步骤四：在 LobeChat 中配置 vLLM
+
+  - 访问 LobeChat 的 `应用设置`界面
+  - 在 `语言模型` 下找到 `vLLM` 的设置项
+
+  <Image alt={'填写 vLLM API 密钥'} inStep src={'https://github.com/user-attachments/assets/669c68bf-3f85-4a6f-bb08-d0d7fb7f7417'} />
+
+  - 打开 vLLM 服务商并填入 API 服务地址以及 API Key
+
+  <Callout type={"warning"}>
+    * 如果你的 vLLM 没有配置 API Key，请将 API Key 留空
+    * 如果你的 vLLM 运行在本地，请确保打开`客户端请求模式`
+  </Callout>
+
+  - 在下方的模型列表中添加你运行的模型
+  - 为你的助手选择一个 vLLM 运行的模型即可开始对话
+
+  <Image alt={'选择 vLLM 模型'} inStep src={'https://github.com/user-attachments/assets/fcdfb9c5-819a-488f-b28d-0857fe861219'} />
+</Steps>
+
+至此你已经可以在 LobeChat 中使用 vLLM 提供的模型进行对话了。
@@ -0,0 +1,47 @@
+---
+title: Using the Volcano Engine API Key in LobeChat
+description: Learn how to configure and use the Volcano Engine AI model in LobeChat, obtain API keys, and start conversations.
+tags:
+  - LobeChat
+  - Volcengine
+  - Doubao
+  - API Key
+  - Web UI
+---
+# Using Volcengine in LobeChat
+
+<Image alt={'Using Volcengine in LobeChat'} cover src={'https://github.com/user-attachments/assets/b9da065e-f964-44f2-8260-59e182be2729'} />
+
+[Volcengine](https://www.volcengine.com/) is a cloud service platform under ByteDance that provides large language model (LLM) services through "Volcano Ark," supporting multiple mainstream models such as Baichuan Intelligent, Mobvoi, and more.
+
+This document will guide you on how to use Volcengine in LobeChat:
+
+<Steps>
+  ### Step 1: Obtain the Volcengine API Key
+  - First, visit the [Volcengine official website](https://www.volcengine.com/) and complete the registration and login process.
+  - Access the Volcengine console and navigate to [Volcano Ark](https://console.volcengine.com/ark/).
+
+<Image alt={'Entering Volcano Ark API Management Page'} inStep src={'https://github.com/user-attachments/assets/d6ace96f-0398-4847-83e1-75c3004a0e8b'} />
+
+- Go to the `API Key Management` menu and click `Create API Key`.
+- Copy and save the created API Key.
+
+### Step 2: Configure Volcengine in LobeChat
+
+- Navigate to the `Application Settings` page in LobeChat and select `AI Service Providers`.
+- Find the `Volcengine` option in the provider list.
+
+<Image alt={'Entering Volcengine API Key'} inStep src={'https://github.com/user-attachments/assets/237864d6-cc5d-4fe4-8a2b-c278016855c5'} />
+
+- Open the Volcengine service provider and enter the obtained API Key.
+- Choose a Volcengine model for your assistant to start the conversation.
+
+<Image alt={'Selecting a Volcengine Model'} inStep src={'https://github.com/user-attachments/assets/702c191f-8250-4462-aed7-accb18b18dea'} />
+
+<Callout type={'warning'}>
+During usage, you may need to pay the API service provider, so please refer to Volcengine's pricing policy. 
+</Callout>
+
+</Steps>
+
+You can now use the models provided by Volcengine for conversations in LobeChat.
@@ -0,0 +1,48 @@
+---
+title: 在 LobeChat 中使用火山引擎 API Key
+description: 学习如何在 LobeChat 中配置和使用火山引擎 AI 模型，获取 API 密钥并开始对话。
+tags:
+  - LobeChat
+  - 火山引擎
+  - 豆包
+  - API密钥
+  - Web UI
+---
+
+# 在 LobeChat 中使用火山引擎
+
+<Image alt={'在 LobeChat 中使用火山引擎'} cover src={'https://github.com/user-attachments/assets/b9da065e-f964-44f2-8260-59e182be2729'} />
+
+[火山引擎](https://www.volcengine.com/)是字节跳动旗下的云服务平台，通过 "火山方舟" 提供大型语言模型 (LLM) 服务，支持多个主流模型如百川智能、Mobvoi 等。
+
+本文档将指导你如何在 LobeChat 中使用火山引擎:
+
+<Steps>
+  ### 步骤一：获取火山引擎 API 密钥
+
+  - 首先，访问[火山引擎官网](https://www.volcengine.com/)并完成注册登录
+  - 进入火山引擎控制台并导航至[火山方舟](https://console.volcengine.com/ark/)
+
+  <Image alt={'进入火山方舟API管理页面'} inStep src={'https://github.com/user-attachments/assets/d6ace96f-0398-4847-83e1-75c3004a0e8b'} />
+
+  - 进入 `API key 管理` 菜单，并点击 `创建 API Key`
+  - 复制并保存创建好的 API Key
+
+  ### 步骤二：在 LobeChat 中配置火山引擎
+
+  - 访问 LobeChat 的 `应用设置` 的 `AI 服务供应商` 界面
+  - 在供应商列表中找到 `火山引擎` 的设置项
+
+  <Image alt={'填写火山引擎 API 密钥'} inStep src={'https://github.com/user-attachments/assets/237864d6-cc5d-4fe4-8a2b-c278016855c5'} />
+
+  - 打开火山引擎服务商并填入获取的 API 密钥
+  - 为你的助手选择一个火山引擎模型即可开始对话
+
+  <Image alt={'选择火山引擎模型'} inStep src={'https://github.com/user-attachments/assets/702c191f-8250-4462-aed7-accb18b18dea'} />
+
+  <Callout type={'warning'}>
+    在使用过程中你可能需要向 API 服务提供商付费，请参考火山引擎的相关费用政策。
+  </Callout>
+</Steps>
+
+至此你已经可以在 LobeChat 中使用火山引擎提供的模型进行对话了。
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} نسخة",
  "emptyAgent": "لا يوجد مساعد",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "يمكن تقليل تكلفة توليد محادثة واحدة بنسبة تصل إلى 90%، وزيادة سرعة الاستجابة بمقدار 4 مرات (<1>اعرف المزيد</1>). عند التفعيل، سيتم تعطيل حد عدد الرسائل التاريخية تلقائيًا",
+      "title": "تفعيل تخزين السياق"
+    },
    "enableReasoning": {
+      "desc": "استنادًا إلى آلية تفكير كلود (Claude Thinking) المحدودة (<1>اعرف المزيد</1>)، عند التفعيل، سيتم تعطيل حد عدد الرسائل التاريخية تلقائيًا",
      "title": "تفعيل التفكير العميق"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "وظائف توسيع النموذج"
  },
+  "history": {
+    "title": "سيتذكر المساعد آخر {{count}} رسالة فقط"
+  },
  "historyRange": "نطاق التاريخ",
  "historySummary": "ملخص الرسائل التاريخية",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "يوجد موضوعات فرعية، لا يمكن الحذف",
    "regenerate": "إعادة الإنشاء"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "نقاط",
+      "creditPricing": "التسعير",
+      "creditTooltip": "لتسهيل العد، نقوم بتحويل 1$ إلى 1M نقطة، على سبيل المثال، 3$/M رموز تعني 3 نقاط/رمز",
+      "pricing": {
+        "inputCachedTokens": "مدخلات مخزنة {{amount}}/نقطة · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M حرف",
+        "inputMinutes": "${{amount}}/دقيقة",
+        "inputTokens": "مدخلات {{amount}}/نقطة · ${{amount}}/M",
+        "outputTokens": "مخرجات {{amount}}/نقطة · ${{amount}}/M",
+        "writeCacheInputTokens": "تخزين إدخال الكتابة {{amount}}/نقطة · ${{amount}}/ميغابايت"
+      }
+    },
+    "tokenDetails": {
+      "average": "متوسط السعر",
+      "input": "مدخلات",
+      "inputAudio": "مدخلات صوتية",
+      "inputCached": "مدخلات مخزنة",
+      "inputCitation": "اقتباس الإدخال",
+      "inputText": "مدخلات نصية",
+      "inputTitle": "تفاصيل المدخلات",
+      "inputUncached": "مدخلات غير مخزنة",
+      "inputWriteCached": "تخزين إدخال الكتابة",
+      "output": "مخرجات",
+      "outputAudio": "مخرجات صوتية",
+      "outputText": "مخرجات نصية",
+      "outputTitle": "تفاصيل المخرجات",
+      "reasoning": "تفكير عميق",
+      "title": "تفاصيل التوليد",
+      "total": "الإجمالي المستهلك"
+    }
+  },
  "newAgent": "مساعد جديد",
  "pin": "تثبيت",
  "pinOff": "إلغاء التثبيت",
@@ -322,6 +322,9 @@
    "tooltip": "تحديث التكوين الأساسي للمزود",
    "updateSuccess": "تم التحديث بنجاح"
  },
+  "updateCustomAiProvider": {
+    "title": "تحديث إعدادات مزود الذكاء الاصطناعي المخصص"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "أدخل مفاتيح Vertex AI الخاصة بك",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B يدعم 16K توكن، ويوفر قدرة توليد لغوية فعالة وسلسة."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything، أحدث نموذج مفتوح المصدر تم تعديله، يحتوي على 34 مليار معلمة، ويدعم تعديلات متعددة لمشاهد الحوار، مع بيانات تدريب عالية الجودة تتماشى مع تفضيلات البشر."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything، أحدث نموذج مفتوح المصدر تم تعديله، يحتوي على 9 مليار معلمة، ويدعم تعديلات متعددة لمشاهد الحوار، مع بيانات تدريب عالية الجودة تتماشى مع تفضيلات البشر."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro كعضو مهم في سلسلة نماذج 360 AI، يلبي احتياجات معالجة النصوص المتنوعة بفعالية، ويدعم فهم النصوص الطويلة والحوار المتعدد الجولات."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview هو نموذج بحثي طورته فريق Qwen يركز على قدرات الاستدلال البصري، حيث يتمتع بميزة فريدة في فهم المشاهد المعقدة وحل المشكلات الرياضية المتعلقة بالرؤية."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ هو نموذج استدلال من سلسلة Qwen. مقارنةً بالنماذج التقليدية المعتمدة على تحسين التعليمات، يتمتع QwQ بقدرة على التفكير والاستدلال، مما يتيح له تحقيق أداء معزز بشكل ملحوظ في المهام اللاحقة، خاصة في حل المشكلات الصعبة. QwQ-32B هو نموذج استدلال متوسط الحجم، قادر على تحقيق أداء تنافسي عند مقارنته بأحدث نماذج الاستدلال (مثل DeepSeek-R1، o1-mini). يستخدم هذا النموذج تقنيات مثل RoPE، SwiGLU، RMSNorm وAttention QKV bias، ويتميز بهيكل شبكة مكون من 64 طبقة و40 رأس انتباه Q (حيث KV في هيكل GQA هو 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview هو أحدث نموذج بحث تجريبي من Qwen، يركز على تعزيز قدرات الاستدلال للذكاء الاصطناعي. من خلال استكشاف آليات معقدة مثل خلط اللغة والاستدلال التكراري، تشمل المزايا الرئيسية القدرة القوية على التحليل الاستدلالي، والقدرات الرياضية والبرمجية. في الوقت نفسه، هناك أيضًا مشكلات في تبديل اللغة، ودورات الاستدلال، واعتبارات الأمان، واختلافات في القدرات الأخرى."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "لقد رفع كلود 3.5 سونيت معايير الصناعة، حيث تفوق أداؤه على نماذج المنافسين ونموذج كلود 3 أوبس، وأظهر أداءً ممتازًا في تقييمات واسعة، مع الحفاظ على سرعة وتكلفة نماذجنا المتوسطة."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet هو أحدث نموذج من Anthropic، يتميز بأداء ممتاز في تقييمات واسعة، ويتفوق على نماذج المنافسين ونموذج Claude 3.5 Sonnet، مع الحفاظ على سرعة وتكلفة نماذجنا المتوسطة."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku هو أسرع وأصغر نموذج من Anthropic، يوفر سرعة استجابة شبه فورية. يمكنه بسرعة الإجابة على الاستفسارات والطلبات البسيطة. سيتمكن العملاء من بناء تجربة ذكاء اصطناعي سلسة تحاكي التفاعل البشري. يمكن لـ Claude 3 Haiku معالجة الصور وإرجاع إخراج نصي، مع نافذة سياقية تبلغ 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 هو نموذج متعدد اللغات أطلقته Cohere، يدعم 23 لغة، مما يسهل التطبيقات اللغوية المتنوعة."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B هو نموذج لغوي كبير مفتوح المصدر قابل للاستخدام التجاري تم تطويره بواسطة Baichuan Intelligence، ويحتوي على 13 مليار معلمة، وقد حقق أفضل النتائج في المعايير الصينية والإنجليزية."
+  },
  "charglm-3": {
    "description": "CharGLM-3 مصمم خصيصًا للأدوار التفاعلية والمرافقة العاطفية، يدعم ذاكرة متعددة الجولات طويلة الأمد وحوارات مخصصة، ويستخدم على نطاق واسع."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 يعزز بشكل كبير من قدرة النموذج على الاستدلال في ظل وجود بيانات محدودة جدًا. قبل تقديم الإجابة النهائية، يقوم النموذج أولاً بإخراج سلسلة من التفكير لتحسين دقة الإجابة النهائية."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B هو نموذج لغوي كبير يعتمد على Llama3.3 70B، حيث يحقق أداءً تنافسيًا مماثلاً للنماذج الرائدة الكبيرة من خلال استخدام التعديلات المستندة إلى مخرجات DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B هو نموذج لغوي كبير مكرر يعتمد على Llama-3.1-8B-Instruct، تم تدريبه باستخدام مخرجات DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B هو نموذج لغوي كبير مكرر يعتمد على Qwen 2.5 14B، تم تدريبه باستخدام مخرجات DeepSeek R1. لقد تفوق هذا النموذج في العديد من اختبارات المعايير على نموذج OpenAI o1-mini، محققًا أحدث الإنجازات التقنية في النماذج الكثيفة. فيما يلي بعض نتائج اختبارات المعايير:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nتصنيف CodeForces: 1481\nأظهر هذا النموذج أداءً تنافسيًا مماثلاً للنماذج الرائدة الأكبر حجمًا من خلال التعديل المستند إلى مخرجات DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B هو نموذج لغوي كبير مكرر يعتمد على Qwen 2.5 32B، تم تدريبه باستخدام مخرجات DeepSeek R1. لقد تفوق هذا النموذج في العديد من اختبارات المعايير على نموذج OpenAI o1-mini، محققًا أحدث الإنجازات التقنية في النماذج الكثيفة. فيما يلي بعض نتائج اختبارات المعايير:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nتصنيف CodeForces: 1691\nأظهر هذا النموذج أداءً تنافسيًا مماثلاً للنماذج الرائدة الأكبر حجمًا من خلال التعديل المستند إلى مخرجات DeepSeek R1."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 هو أحدث نموذج مفتوح المصدر أطلقه فريق DeepSeek، ويتميز بأداء استدلال قوي للغاية، خاصة في المهام الرياضية والبرمجة والاستدلال، حيث وصل إلى مستوى مماثل لنموذج OpenAI o1."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 يعزز بشكل كبير من قدرة النموذج على الاستدلال في ظل وجود بيانات محدودة جدًا. قبل تقديم الإجابة النهائية، يقوم النموذج أولاً بإخراج سلسلة من التفكير لتحسين دقة الإجابة النهائية."
  },
+  "deepseek/deepseek-v3": {
+    "description": "حقق DeepSeek-V3 تقدمًا كبيرًا في سرعة الاستدلال مقارنة بالنماذج السابقة. يحتل المرتبة الأولى بين النماذج المفتوحة المصدر، ويمكن مقارنته بأحدث النماذج المغلقة على مستوى العالم. يعتمد DeepSeek-V3 على بنية الانتباه المتعدد الرؤوس (MLA) وبنية DeepSeekMoE، والتي تم التحقق منها بشكل شامل في DeepSeek-V2. بالإضافة إلى ذلك، قدم DeepSeek-V3 استراتيجية مساعدة غير مدمرة للتوازن في الحمل، وحدد أهداف تدريب متعددة التسمية لتحقيق أداء أقوى."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "حقق DeepSeek-V3 تقدمًا كبيرًا في سرعة الاستدلال مقارنة بالنماذج السابقة. يحتل المرتبة الأولى بين النماذج المفتوحة المصدر، ويمكن مقارنته بأحدث النماذج المغلقة على مستوى العالم. يعتمد DeepSeek-V3 على بنية الانتباه المتعدد الرؤوس (MLA) وبنية DeepSeekMoE، والتي تم التحقق منها بشكل شامل في DeepSeek-V2. بالإضافة إلى ذلك، قدم DeepSeek-V3 استراتيجية مساعدة غير مدمرة للتوازن في الحمل، وحدد أهداف تدريب متعددة التسمية لتحقيق أداء أقوى."
+  },
  "doubao-1.5-lite-32k": {
    "description": "دو باو 1.5 لايت هو نموذج الجيل الجديد الخفيف، مع سرعة استجابة قصوى، حيث يصل الأداء والوقت المستغرق إلى مستوى عالمي."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash يقدم ميزات وتحسينات من الجيل التالي، بما في ذلك سرعة فائقة، واستخدام أدوات أصلية، وتوليد متعدد الوسائط، ونافذة سياق تصل إلى 1M توكن."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "نموذج جمنّي 2.0 فلاش هو نسخة معدلة، تم تحسينها لتحقيق الكفاءة من حيث التكلفة والحد من التأخير."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "نموذج جمنّي 2.0 فلاش هو نسخة معدلة، تم تحسينها لتحقيق الكفاءة من حيث التكلفة والحد من التأخير."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "نموذج Gemini 2.0 Flash، تم تحسينه لأهداف التكلفة المنخفضة والكمون المنخفض."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp هو أحدث نموذج تجريبي متعدد الوسائط من Google، يتمتع بميزات الجيل التالي، وسرعة فائقة، واستدعاء أدوات أصلية، وتوليد متعدد الوسائط."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp هو أحدث نموذج تجريبي متعدد الوسائط من Google، يتمتع بميزات الجيل التالي، وسرعة فائقة، واستدعاء أدوات أصلية، وتوليد متعدد الوسائط."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "نموذج GPT-4 Turbo الأحدث يتمتع بقدرات بصرية. الآن، يمكن استخدام الطلبات البصرية باستخدام نمط JSON واستدعاء الوظائف. GPT-4 Turbo هو إصدار معزز يوفر دعمًا فعالًا من حيث التكلفة للمهام متعددة الوسائط. يجد توازنًا بين الدقة والكفاءة، مما يجعله مناسبًا للتطبيقات التي تتطلب تفاعلات في الوقت الحقيقي."
  },
+  "gpt-4.5-preview": {
+    "description": "نسخة المعاينة البحثية لـ GPT-4.5، وهي أكبر وأقوى نموذج GPT لدينا حتى الآن. تتمتع بمعرفة واسعة عن العالم وتفهم أفضل لنوايا المستخدم، مما يجعلها بارعة في المهام الإبداعية والتخطيط الذاتي. يمكن لـ GPT-4.5 قبول المدخلات النصية والصورية وتوليد مخرجات نصية (بما في ذلك المخرجات الهيكلية). تدعم ميزات المطورين الأساسية مثل استدعاء الدوال، وواجهة برمجة التطبيقات الجماعية، والمخرجات المتدفقة. تتألق GPT-4.5 بشكل خاص في المهام التي تتطلب التفكير الإبداعي، والتفكير المفتوح، والحوار (مثل الكتابة، والتعلم، أو استكشاف أفكار جديدة). تاريخ انتهاء المعرفة هو أكتوبر 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o هو نموذج ديناميكي يتم تحديثه في الوقت الحقيقي للحفاظ على أحدث إصدار. يجمع بين فهم اللغة القوي وقدرات التوليد، مما يجعله مناسبًا لمجموعة واسعة من التطبيقات، بما في ذلك خدمة العملاء والتعليم والدعم الفني."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B هو نموذج عالي الأداء، يوفر قدرة سريعة على توليد النصوص، مما يجعله مثاليًا لمجموعة من التطبيقات التي تتطلب كفاءة كبيرة وتكلفة فعالة."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "نموذج Llama 3.1 Sonar Huge Online، يتمتع بـ 405B من المعلمات، يدعم طول سياق حوالي 127,000 علامة، مصمم لتطبيقات دردشة معقدة عبر الإنترنت."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "نموذج Llama 3.1 Sonar Large Online، يتمتع بـ 70B من المعلمات، يدعم طول سياق حوالي 127,000 علامة، مناسب لمهام دردشة عالية السعة ومتنوعة."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "نموذج Llama 3.1 Sonar Small Online، يتمتع بـ 8B من المعلمات، يدعم طول سياق حوالي 127,000 علامة، مصمم للدردشة عبر الإنترنت، قادر على معالجة تفاعلات نصية متنوعة بكفاءة."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "قدرة استدلال الصور التي تبرز في الصور عالية الدقة، مناسبة لتطبيقات الفهم البصري."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "تم تصميم LLaMA 3.2 لمعالجة المهام التي تجمع بين البيانات البصرية والنصية. إنه يتفوق في مهام وصف الصور والأسئلة البصرية، متجاوزًا الفجوة بين توليد اللغة والاستدلال البصري."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "تم تصميم LLaMA 3.2 لمعالجة المهام التي تجمع بين البيانات البصرية والنصية. إنه يتفوق في مهام وصف الصور والأسئلة البصرية، متجاوزًا الفجوة بين توليد اللغة والاستدلال البصري."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "نموذج لغة ضخم من Qwen بمستوى تريليونات، يدعم إدخال لغات مختلفة مثل الصينية والإنجليزية، وهو النموذج API وراء إصدار Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "تدعم نماذج كيوين-أومني إدخال بيانات متعددة الأنماط، بما في ذلك الفيديو والصوت والصور والنصوص، وتخرج الصوت والنص."
+  },
  "qwen-plus": {
    "description": "نموذج لغة ضخم من توغي، نسخة معززة، يدعم إدخال لغات مختلفة مثل الصينية والإنجليزية."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "نموذج تم تدريبه باستخدام نموذج Qwen-7B اللغوي، مع إضافة نموذج الصور، بدقة إدخال الصور 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 هو سلسلة جديدة من نماذج اللغة الكبيرة Qwen. Qwen2 7B هو نموذج يعتمد على بنية transformer، ويظهر أداءً ممتازًا في فهم اللغة، والقدرات متعددة اللغات، والبرمجة، والرياضيات، والاستدلال."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 هو سلسلة جديدة من نماذج اللغة الكبيرة، تتمتع بقدرات فهم وتوليد أقوى."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL هو الإصدار الأحدث من نموذج Qwen-VL، وقد حقق أداءً متقدمًا في اختبارات الفهم البصري، بما في ذلك MathVista وDocVQA وRealWorldQA وMTVQA. يمكن لـ Qwen2-VL فهم مقاطع الفيديو التي تزيد مدتها عن 20 دقيقة، مما يتيح إجابات عالية الجودة على الأسئلة المستندة إلى الفيديو، والمحادثات، وإنشاء المحتوى. كما يتمتع بقدرات استدلال واتخاذ قرارات معقدة، ويمكن دمجه مع الأجهزة المحمولة والروبوتات، مما يتيح التشغيل التلقائي بناءً على البيئة البصرية والتعليمات النصية. بالإضافة إلى الإنجليزية والصينية، يدعم Qwen2-VL الآن فهم النصوص بلغات مختلفة في الصور، بما في ذلك معظم اللغات الأوروبية واليابانية والكورية والعربية والفيتنامية."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct هو أحد أحدث نماذج اللغة الكبيرة التي أصدرتها Alibaba Cloud. يتمتع هذا النموذج 72B بقدرات محسنة بشكل ملحوظ في مجالات الترميز والرياضيات. كما يوفر النموذج دعمًا متعدد اللغات، يغطي أكثر من 29 لغة، بما في ذلك الصينية والإنجليزية. وقد حقق النموذج تحسينات ملحوظة في اتباع التعليمات وفهم البيانات الهيكلية وتوليد المخرجات الهيكلية (خاصة JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct هو أحد أحدث نماذج اللغة الكبيرة التي أصدرتها Alibaba Cloud. يتمتع هذا النموذج 32B بقدرات محسنة بشكل ملحوظ في مجالات الترميز والرياضيات. كما يوفر النموذج دعمًا متعدد اللغات، يغطي أكثر من 29 لغة، بما في ذلك الصينية والإنجليزية. وقد حقق النموذج تحسينات ملحوظة في اتباع التعليمات وفهم البيانات الهيكلية وتوليد المخرجات الهيكلية (خاصة JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "نموذج لغوي موجه للغة الصينية والإنجليزية، يستهدف مجالات اللغة، والبرمجة، والرياضيات، والاستدلال، وغيرها."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ هو نموذج بحث تجريبي يركز على تحسين قدرات الاستدلال للذكاء الاصطناعي."
  },
+  "qwq-32b": {
+    "description": "نموذج استدلال QwQ المدرب على نموذج Qwen2.5-32B، الذي يعزز بشكل كبير من قدرة الاستدلال للنموذج من خلال التعلم المعزز. تصل المؤشرات الأساسية للنموذج (AIME 24/25، LiveCodeBench) وبعض المؤشرات العامة (IFEval، LiveBench وغيرها) إلى مستوى DeepSeek-R1 الكامل، حيث تتجاوز جميع المؤشرات بشكل ملحوظ نموذج DeepSeek-R1-Distill-Qwen-32B المعتمد أيضًا على Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "نموذج QwQ هو نموذج بحث تجريبي تم تطويره بواسطة فريق Qwen، يركز على تعزيز قدرات الاستدلال للذكاء الاصطناعي."
  },
+  "qwq-plus-latest": {
+    "description": "نموذج استدلال QwQ المدرب على نموذج Qwen2.5، الذي يعزز بشكل كبير من قدرة الاستدلال للنموذج من خلال التعلم المعزز. تصل المؤشرات الأساسية للنموذج (AIME 24/25، LiveCodeBench) وبعض المؤشرات العامة (IFEval، LiveBench وغيرها) إلى مستوى DeepSeek-R1 الكامل."
+  },
+  "r1-1776": {
+    "description": "R1-1776 هو إصدار من نموذج DeepSeek R1، تم تدريبه لاحقًا لتقديم معلومات حقائق غير خاضعة للرقابة وغير متحيزة."
+  },
  "solar-mini": {
    "description": "Solar Mini هو نموذج LLM مدمج، يتفوق على GPT-3.5، ويتميز بقدرات متعددة اللغات قوية، ويدعم الإنجليزية والكورية، ويقدم حلولًا فعالة وصغيرة الحجم."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "منتج بحث خفيف الوزن يعتمد على سياق البحث، أسرع وأرخص من Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "تقوم Deep Research بإجراء أبحاث شاملة على مستوى الخبراء وتجميعها في تقارير يمكن الوصول إليها وقابلة للتنفيذ."
+  },
  "sonar-pro": {
    "description": "منتج بحث متقدم يدعم سياق البحث، مع دعم للاستعلامات المتقدمة والمتابعة."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "نموذج التضمين من الجيل الجديد، فعال واقتصادي، مناسب لاسترجاع المعرفة وتطبيقات RAG وغيرها."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "الإصدار المفتوح من الجيل الأحدث من نموذج GLM-4 الذي أطلقته Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) يوفر قدرة حسابية معززة من خلال استراتيجيات فعالة وهندسة نموذجية."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet يرفع المعايير الصناعية، حيث يتفوق على نماذج المنافسين وClaude 3 Opus، ويظهر أداءً ممتازًا في تقييمات واسعة، مع سرعة وتكلفة تتناسب مع نماذجنا المتوسطة."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "كلود 3.7 سونيت هو أسرع نموذج من الجيل التالي من أنثروبيك. مقارنةً بكلود 3 هايكو، تم تحسين كلود 3.7 سونيت في جميع المهارات، وتجاوز العديد من اختبارات الذكاء لأكبر نموذج من الجيل السابق، كلود 3 أوبس."
+  },
  "whisper-1": {
    "description": "نموذج التعرف على الصوت العام، يدعم التعرف على الصوت متعدد اللغات، والترجمة الصوتية، والتعرف على اللغات."
  },
@@ -140,6 +140,18 @@
      "close": "حذف",
      "confirm": "تم تكوينه وإعادة المحاولة"
    },
+    "crawPages": {
+      "crawling": "جاري التعرف على الروابط",
+      "detail": {
+        "preview": "معاينة",
+        "raw": "النص الأصلي",
+        "tooLong": "محتوى النص طويل جدًا، سيتم الاحتفاظ بالسياق السابق فقط بأول {{characters}} حرف، ولن يتم احتساب الأجزاء الزائدة في سياق المحادثة"
+      },
+      "meta": {
+        "crawler": "وضع الزحف",
+        "words": "عدد الأحرف"
+      }
+    },
    "searchxng": {
      "baseURL": "الرجاء الإدخال",
      "description": "الرجاء إدخال عنوان URL لـ SearchXNG لبدء البحث عبر الإنترنت",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity هي شركة رائدة في تقديم نماذج توليد الحوار، تقدم مجموعة من نماذج Llama 3.1 المتقدمة، تدعم التطبيقات عبر الإنترنت وغير المتصلة، وتناسب بشكل خاص مهام معالجة اللغة الطبيعية المعقدة."
  },
+  "ppio": {
+    "description": "تقدم PPIO بايو السحابية خدمات واجهة برمجة التطبيقات لنماذج مفتوحة المصدر مستقرة وذات تكلفة فعالة، تدعم جميع سلسلة DeepSeek، وLlama، وQwen، وغيرها من النماذج الكبيرة الرائدة في الصناعة."
+  },
  "qwen": {
    "description": "Qwen هو نموذج لغة ضخم تم تطويره ذاتيًا بواسطة Alibaba Cloud، يتمتع بقدرات قوية في فهم وتوليد اللغة الطبيعية. يمكنه الإجابة على مجموعة متنوعة من الأسئلة، وكتابة المحتوى، والتعبير عن الآراء، وكتابة الشيفرات، ويؤدي دورًا في مجالات متعددة."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Копие",
  "emptyAgent": "Няма наличен асистент",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "Разходите за генериране на единичен разговор могат да бъдат намалени с до 90%, а скоростта на отговорите да се увеличи 4 пъти (<1>Научете повече</1>). При активиране автоматично ще се деактивира ограничението на броя на историческите съобщения",
+      "title": "Активиране на кеширане на контекста"
+    },
    "enableReasoning": {
+      "desc": "Ограничения на механизма Claude Thinking (<1>Научете повече</1>), при активиране автоматично ще се деактивира ограничението на броя на историческите съобщения",
      "title": "Активиране на дълбочинно мислене"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Разширени функции на модела"
  },
+  "history": {
+    "title": "Асистентът ще запомни само последните {{count}} съобщения"
+  },
  "historyRange": "Диапазон на историята",
  "historySummary": "Исторически обобщение на съобщения",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Съществуват подтеми, не можете да изтриете.",
    "regenerate": "Прегенерирай"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Кредити",
+      "creditPricing": "Ценообразуване",
+      "creditTooltip": "За удобство при броенето, 1$ се преобразува в 1M кредити, например $3/M токени се преобразува в 3 кредита/token",
+      "pricing": {
+        "inputCachedTokens": "Кеширани входящи {{amount}}/кредити · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M символи",
+        "inputMinutes": "${{amount}}/минута",
+        "inputTokens": "Входящи {{amount}}/кредити · ${{amount}}/M",
+        "outputTokens": "Изходящи {{amount}}/кредити · ${{amount}}/M",
+        "writeCacheInputTokens": "Кеширане на входящи данни {{amount}}/точки · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Средна цена",
+      "input": "Вход",
+      "inputAudio": "Аудио вход",
+      "inputCached": "Кеширан вход",
+      "inputCitation": "Цитиране на входящи данни",
+      "inputText": "Текстов вход",
+      "inputTitle": "Детайли за входа",
+      "inputUncached": "Некеширан вход",
+      "inputWriteCached": "Входящи кеширани данни",
+      "output": "Изход",
+      "outputAudio": "Аудио изход",
+      "outputText": "Текстов изход",
+      "outputTitle": "Детайли за изхода",
+      "reasoning": "Дълбочинно разсъждение",
+      "title": "Детайли за генериране",
+      "total": "Общо разходи"
+    }
+  },
  "newAgent": "Нов агент",
  "pin": "Закачи",
  "pinOff": "Откачи",
@@ -322,6 +322,9 @@
    "tooltip": "Актуализиране на основната конфигурация на доставчика",
    "updateSuccess": "Актуализацията е успешна"
  },
+  "updateCustomAiProvider": {
+    "title": "Актуализиране на конфигурацията на доставчика на персонализирани AI услуги"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Въведете вашите ключове за Vertex AI",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B поддържа 16K токена, предоставяйки ефективни и плавни способности за генериране на език."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "零一万物, най-новият отворен модел с фина настройка, с 34 милиарда параметри, който поддържа множество диалогови сценарии, с висококачествени обучителни данни, съобразени с човешките предпочитания."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "零一万物, най-новият отворен модел с фина настройка, с 9 милиарда параметри, който поддържа множество диалогови сценарии, с висококачествени обучителни данни, съобразени с човешките предпочитания."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, като важен член на серията AI модели на 360, отговаря на разнообразни приложения на естествения език с ефективни способности за обработка на текст, поддържайки разбиране на дълги текстове и многостепенни диалози."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview е изследователски модел, разработен от екипа на Qwen, който се фокусира върху визуалните способности за извеждане и притежава уникални предимства в разбирането на сложни сцени и решаването на визуално свързани математически проблеми."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ е моделът за изводи от серията Qwen. В сравнение с традиционните модели за оптимизация на инструкции, QwQ притежава способности за разсъждение и извод, което позволява значително подобряване на производителността в задачи от по-ниско ниво, особено при решаване на трудни проблеми. QwQ-32B е среден модел за изводи, който постига конкурентоспособна производителност в сравнение с най-съвременните модели за изводи (като DeepSeek-R1, o1-mini). Този модел използва технологии като RoPE, SwiGLU, RMSNorm и Attention QKV bias, с 64 слоя в мрежовата структура и 40 Q внимание глави (в архитектурата GQA KV е 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview е най-новият експериментален изследователски модел на Qwen, който се фокусира върху подобряване на AI разсъдъчните способности. Чрез изследване на сложни механизми като езикови смеси и рекурсивно разсъждение, основните предимства включват мощни аналитични способности, математически и програмистки умения. В същото време съществуват проблеми с езиковото превключване, цикли на разсъждение, съображения за безопасност и разлики в други способности."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet повишава индустриалните стандарти, с производителност, надминаваща конкурентните модели и Claude 3 Opus, показвайки отлични резултати в широки оценки, като същевременно предлага скорост и разходи, характерни за нашите модели от среден клас."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet повишава индустриалните стандарти, с производителност, надвишаваща конкурентните модели и Claude 3 Opus, с отлични резултати в широки оценки, като същевременно предлага скорост и разходи, характерни за нашите модели от среден клас."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku е най-бързият и компактен модел на Anthropic, предлагащ почти мигновена скорост на отговор. Той може бързо да отговаря на прости запитвания и заявки. Клиентите ще могат да изградят безпроблемно AI изживяване, имитиращо човешко взаимодействие. Claude 3 Haiku може да обработва изображения и да връща текстови изходи, с контекстуален прозорец от 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 е многозначен модел, представен от Cohere, поддържащ 23 езика, предоставяйки удобство за многоезични приложения."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B е отворен, комерсиален голям езиков модел, разработен от Baichuan Intelligence, с 13 милиарда параметри, който постига най-добрите резултати в своя размер на авторитетни бенчмаркове на китайски и английски."
+  },
  "charglm-3": {
    "description": "CharGLM-3 е проектиран за ролеви игри и емоционално придружаване, поддържаща дълга многократна памет и персонализиран диалог, с широко приложение."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 значително подобри способността на модела за разсъждение при наличието на много малко маркирани данни. Преди да предостави окончателния отговор, моделът първо ще изведе част от съдържанието на веригата на мислене, за да повиши точността на окончателния отговор."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B е голям езиков модел, базиран на Llama3.3 70B, който използва фина настройка на изхода на DeepSeek R1, за да постигне конкурентна производителност, сравнима с големите водещи модели."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B е дестилиран голям езиков модел, базиран на Llama-3.1-8B-Instruct, обучен с изхода на DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B е дестилиран голям езиков модел, базиран на Qwen 2.5 14B, обучен с изхода на DeepSeek R1. Този модел надминава o1-mini на OpenAI в множество бенчмарков, постигащи най-съвременни резултати за плътни модели. Ето някои от резултатите от бенчмарковете:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nТози модел демонстрира конкурентна производителност, сравнима с по-големи водещи модели, благодарение на фина настройка на изхода на DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B е дестилиран голям езиков модел, базиран на Qwen 2.5 32B, обучен с изхода на DeepSeek R1. Този модел надминава o1-mini на OpenAI в множество бенчмарков, постигащи най-съвременни резултати за плътни модели. Ето някои от резултатите от бенчмарковете:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nТози модел демонстрира конкурентна производителност, сравнима с по-големи водещи модели, благодарение на фина настройка на изхода на DeepSeek R1."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 е най-новият отворен модел, публикуван от екипа на DeepSeek, който предлага изключителна производителност при извеждане, особено в математически, програмистки и логически задачи, достигайки ниво, сравнимо с модела o1 на OpenAI."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 значително подобри способността на модела за разсъждение при наличието на много малко маркирани данни. Преди да предостави окончателния отговор, моделът първо ще изведе част от съдържанието на веригата на мислене, за да повиши точността на окончателния отговор."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 постига значителен напредък в скоростта на извеждане в сравнение с предишните модели. Той е на първо място сред отворените модели и може да се сравнява с най-съвременните затворени модели в света. DeepSeek-V3 използва архитектури с многоглаво внимание (MLA) и DeepSeekMoE, които бяха напълно валидирани в DeepSeek-V2. Освен това, DeepSeek-V3 въвежда помощна беззагубна стратегия за баланс на натоварването и задава цели за обучение с множество етикети, за да постигне по-силна производителност."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 постига значителен напредък в скоростта на извеждане в сравнение с предишните модели. Той е на първо място сред отворените модели и може да се сравнява с най-съвременните затворени модели в света. DeepSeek-V3 използва архитектури с многоглаво внимание (MLA) и DeepSeekMoE, които бяха напълно валидирани в DeepSeek-V2. Освен това, DeepSeek-V3 въвежда помощна беззагубна стратегия за баланс на натоварването и задава цели за обучение с множество етикети, за да постигне по-силна производителност."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite е ново поколение лек модел, с изключителна скорост на отговор, който постига световно ниво както по отношение на ефективността, така и на времето за реакция."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash предлага следващо поколение функции и подобрения, включително изключителна скорост, нативна употреба на инструменти, многомодално генериране и контекстен прозорец от 1M токена."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash е вариант на модела, оптимизиран за икономичност и ниска латентност."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash е вариант на модела, оптимизиран за икономичност и ниска латентност."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Модел на Gemini 2.0 Flash, оптимизиран за икономичност и ниска латентност."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp е най-новият експериментален многомодален AI модел на Google, с ново поколение функции, изключителна скорост, нативно извикване на инструменти и многомодално генериране."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp е най-новият експериментален многомодален AI модел на Google, с ново поколение функции, изключителна скорост, нативно извикване на инструменти и многомодално генериране."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "Най-новият модел GPT-4 Turbo разполага с визуални функции. Сега визуалните заявки могат да се използват с JSON формат и извиквания на функции. GPT-4 Turbo е подобрена версия, която предлага икономически ефективна поддръжка за мултимодални задачи. Той намира баланс между точност и ефективност, подходящ за приложения, изискващи взаимодействие в реално време."
  },
+  "gpt-4.5-preview": {
+    "description": "Изследователската предварителна версия на GPT-4.5, която е нашият най-голям и мощен GPT модел до момента. Тя притежава обширни знания за света и може по-добре да разбира намеренията на потребителите, което я прави изключително ефективна в креативни задачи и автономно планиране. GPT-4.5 приема текстови и изображен вход и генерира текстови изход (включително структурирани изходи). Поддържа ключови функции за разработчици, като извикване на функции, пакетно API и потоков изход. В задачи, изискващи креативно, открито мислене и диалог (като писане, учене или изследване на нови идеи), GPT-4.5 показва особени способности. Крайната дата на знанията е октомври 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o е динамичен модел, който се актуализира в реално време, за да поддържа най-новата версия. Той комбинира мощно разбиране на езика и генериране на текст, подходящ за мащабни приложения, включително обслужване на клиенти, образование и техническа поддръжка."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B е модел с висока производителност, предлагащ бързи способности за генериране на текст, особено подходящ за приложения, изискващи мащабна ефективност и икономичност."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Llama 3.1 Sonar Huge Online модел, с 405B параметри, поддържащ контекстова дължина от около 127,000 маркера, проектиран за сложни онлайн чат приложения."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Llama 3.1 Sonar Large Online модел, с 70B параметри, поддържащ контекстова дължина от около 127,000 маркера, подходящ за задачи с висока капацитет и разнообразие в чата."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Llama 3.1 Sonar Small Online модел, с 8B параметри, поддържащ контекстова дължина от около 127,000 маркера, проектиран за онлайн чат, способен да обработва ефективно различни текстови взаимодействия."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Изключителни способности за визуално разсъждение върху изображения с висока разделителна способност, подходящи за приложения за визуално разбиране."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 е проектиран да обработва задачи, свързващи визуални и текстови данни. Той показва отлични резултати в задачи като описание на изображения и визуални въпроси, преодолявайки пропастта между генерирането на език и визуалното разсъждение."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 е проектиран да обработва задачи, свързващи визуални и текстови данни. Той показва отлични резултати в задачи като описание на изображения и визуални въпроси, преодолявайки пропастта между генерирането на език и визуалното разсъждение."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Qwen Max е езиков модел с мащаб от стотици милиарди параметри, който поддържа вход на различни езици, включително китайски и английски. В момента е основният API модел зад версията на продукта Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "Моделите от серията Qwen-Omni поддържат входни данни от множество модалности, включително видео, аудио, изображения и текст, и генерират аудио и текст."
+  },
  "qwen-plus": {
    "description": "通义千问（Qwen） е подобрена версия на мащабен езиков модел, който поддържа вход на различни езици, включително китайски и английски."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Инициализиран с езиковия модел Qwen-7B, добавя модел за изображения, предтренировъчен модел с резолюция на входа от 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 е новата серия големи езикови модели Qwen. Qwen2 7B е модел, базиран на трансформатор, който показва отлични резултати в разбирането на езика, многоезичните способности, програмирането, математиката и разсъжденията."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 е нова серия от големи езикови модели с по-силни способности за разбиране и генериране."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL е най-новата итерация на модела Qwen-VL, постигайки най-съвременни резултати в бенчмарковете за визуално разбиране, включително MathVista, DocVQA, RealWorldQA и MTVQA. Qwen2-VL може да разбира видеа с продължителност над 20 минути, за висококачествени въпроси и отговори, диалози и създаване на съдържание, базирани на видео. Той също така притежава сложни способности за разсъждение и вземане на решения, които могат да се интегрират с мобилни устройства, роботи и др., за автоматични операции на базата на визуална среда и текстови инструкции. Освен английски и китайски, Qwen2-VL сега поддържа и разбиране на текст на различни езици в изображения, включително повечето европейски езици, японски, корейски, арабски и виетнамски."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct е една от най-новите серии големи езикови модели, публикувани от Alibaba Cloud. Този 72B модел има значителни подобрения в области като кодиране и математика. Моделът предлага и многоезична поддръжка, обхващаща над 29 езика, включително китайски и английски. Моделът показва значителни подобрения в следването на инструкции, разбирането на структурирани данни и генерирането на структурирани изходи (особено JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct е една от най-новите серии големи езикови модели, публикувани от Alibaba Cloud. Този 32B модел има значителни подобрения в области като кодиране и математика. Моделът предлага и многоезична поддръжка, обхващаща над 29 езика, включително китайски и английски. Моделът показва значителни подобрения в следването на инструкции, разбирането на структурирани данни и генерирането на структурирани изходи (особено JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM, насочен към китайски и английски, за области като език, програмиране, математика и разсъждение."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ е експериментален изследователски модел, който се фокусира върху подобряване на AI разсъдъчните способности."
  },
+  "qwq-32b": {
+    "description": "QwQ моделът за изводи, обучен на базата на модела Qwen2.5-32B, значително подобрява способностите си за изводи чрез усилено обучение. Основните показатели на модела, като математически код и други ключови индикатори (AIME 24/25, LiveCodeBench), както и някои общи индикатори (IFEval, LiveBench и др.), достигат нивото на DeepSeek-R1 в пълна версия, като всички показатели значително надвишават тези на DeepSeek-R1-Distill-Qwen-32B, също базиран на Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "QwQ моделът е експериментален изследователски модел, разработен от екипа на Qwen, който се фокусира върху подобряване на AI разсъдъчните способности."
  },
+  "qwq-plus-latest": {
+    "description": "QwQ моделът за изводи, обучен на базата на модела Qwen2.5, значително подобрява способностите си за изводи чрез усилено обучение. Основните показатели на модела, като математически код и други ключови индикатори (AIME 24/25, LiveCodeBench), както и някои общи индикатори (IFEval, LiveBench и др.), достигат нивото на DeepSeek-R1 в пълна версия."
+  },
+  "r1-1776": {
+    "description": "R1-1776 е версия на модела DeepSeek R1, след обучението, която предоставя непроверена и безпристрастна фактическа информация."
+  },
  "solar-mini": {
    "description": "Solar Mini е компактен LLM, който превъзхожда GPT-3.5, с мощни многоезични способности, поддържа английски и корейски, предоставяйки ефективно и компактно решение."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Лек продукт за търсене, базиран на контекст на търсене, по-бърз и по-евтин от Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research извършва задълбочени експертни изследвания и ги обобщава в достъпни и приложими доклади."
+  },
  "sonar-pro": {
    "description": "Разширен продукт за търсене, който поддържа контекст на търсене, напреднали запитвания и проследяване."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Ефективен и икономичен ново поколение модел за вграждане, подходящ за извличане на знания, RAG приложения и други сценарии."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "GLM-4 е последната версия на предварително обучен модел от серията, публикувана от Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) предлага подобрена изчислителна мощ чрез ефективни стратегии и архитектура на модела."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet повишава индустриалните стандарти, с производителност, надминаваща конкурентните модели и Claude 3 Opus, показвайки отлични резултати в широк спектър от оценки, като същевременно предлага скорост и разходи, сравними с нашите модели от средно ниво."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 сонет е най-бързият модел от следващото поколение на Anthropic. В сравнение с Claude 3 Haiku, Claude 3.7 Сонет е подобрен във всички умения и надминава най-големия модел от предишното поколение Claude 3 Opus в много интелектуални тестове."
+  },
  "whisper-1": {
    "description": "Универсален модел за разпознаване на реч, поддържащ многоезично разпознаване на реч, превод на реч и разпознаване на езици."
  },
@@ -140,6 +140,18 @@
      "close": "Изтриване",
      "confirm": "Конфигурацията е завършена и опитайте отново"
    },
+    "crawPages": {
+      "crawling": "Разпознаване на връзки",
+      "detail": {
+        "preview": "Преглед",
+        "raw": "Оригинален текст",
+        "tooLong": "Текстът е твърде дълъг, контекстът на разговора ще запази само първите {{characters}} символа, а останалата част няма да бъде включена в контекста на разговора"
+      },
+      "meta": {
+        "crawler": "Режим на улавяне",
+        "words": "Брой символи"
+      }
+    },
    "searchxng": {
      "baseURL": "Моля, въведете",
      "description": "Моля, въведете URL адреса на SearchXNG, за да започнете търсене в мрежата",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity е водещ доставчик на модели за генериране на диалози, предлагащ множество напреднали модели Llama 3.1, поддържащи онлайн и офлайн приложения, особено подходящи за сложни задачи по обработка на естествен език."
  },
+  "ppio": {
+    "description": "PPIO ПайОу облак предлага стабилни и икономически изгодни API услуги за отворени модели, поддържащи цялата серия DeepSeek, Llama, Qwen и други водещи модели в индустрията."
+  },
  "qwen": {
    "description": "Qwen е самостоятелно разработен свръхголям езиков модел на Alibaba Cloud, с мощни способности за разбиране и генериране на естествен език. Може да отговаря на различни въпроси, да създава текстово съдържание, да изразява мнения и да пише код, играейки роля в множество области."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Kopie",
  "emptyAgent": "Kein Assistent verfügbar",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "Die Kosten für die Generierung einer einzelnen Konversation können um bis zu 90 % gesenkt werden, die Reaktionsgeschwindigkeit wird um das Vierfache erhöht (<1>Mehr erfahren</1>). Wenn aktiviert, wird die Begrenzung der Anzahl historischer Nachrichten automatisch deaktiviert.",
+      "title": "Kontext-Caching aktivieren"
+    },
    "enableReasoning": {
+      "desc": "Basierend auf den Einschränkungen des Claude Thinking-Mechanismus (<1>Mehr erfahren</1>), wird bei Aktivierung die Begrenzung der Anzahl historischer Nachrichten automatisch deaktiviert.",
      "title": "Tiefes Denken aktivieren"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Modell Erweiterungsfunktionen"
  },
+  "history": {
+    "title": "Der Assistent wird nur die letzten {{count}} Nachrichten speichern"
+  },
  "historyRange": "Verlaufsbereich",
  "historySummary": "Zusammenfassung historischer Nachrichten",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Es gibt Unterthemen, die Löschung ist nicht möglich.",
    "regenerate": "Neu generieren"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Punkte",
+      "creditPricing": "Preisgestaltung",
+      "creditTooltip": "Zur Vereinfachung der Zählung rechnen wir 1$ als 1M Punkte um, zum Beispiel werden $3/M Tokens als 3 Punkte/token umgerechnet",
+      "pricing": {
+        "inputCachedTokens": "Zwischengespeicherte Eingabe {{amount}}/Punkte · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M Zeichen",
+        "inputMinutes": "${{amount}}/Minute",
+        "inputTokens": "Eingabe {{amount}}/Punkte · ${{amount}}/M",
+        "outputTokens": "Ausgabe {{amount}}/Punkte · ${{amount}}/M",
+        "writeCacheInputTokens": "Cache-Eingabe schreiben {{amount}}/Punkte · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Durchschnittspreis",
+      "input": "Eingabe",
+      "inputAudio": "Audioeingabe",
+      "inputCached": "Eingabe zwischengespeichert",
+      "inputCitation": "Eingabe zitieren",
+      "inputText": "Text-Eingabe",
+      "inputTitle": "Eingabedetails",
+      "inputUncached": "Eingabe nicht zwischengespeichert",
+      "inputWriteCached": "Eingabe Cache schreiben",
+      "output": "Ausgabe",
+      "outputAudio": "Audioausgabe",
+      "outputText": "Text-Ausgabe",
+      "outputTitle": "Ausgabedetails",
+      "reasoning": "Tiefes Denken",
+      "title": "Generierungsdetails",
+      "total": "Gesamter Verbrauch"
+    }
+  },
  "newAgent": "Neuer Assistent",
  "pin": "Anheften",
  "pinOff": "Anheften aufheben",
@@ -322,6 +322,9 @@
    "tooltip": "Aktualisieren Sie die grundlegenden Anbieterinformationen",
    "updateSuccess": "Aktualisierung erfolgreich"
  },
+  "updateCustomAiProvider": {
+    "title": "Konfiguration des benutzerdefinierten KI-Anbieters aktualisieren"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Geben Sie Ihre Vertex AI-Schlüssel ein",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B unterstützt 16K Tokens und bietet effiziente, flüssige Sprachgenerierungsfähigkeiten."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Yi 1.5, das neueste Open-Source-Fine-Tuning-Modell mit 34 Milliarden Parametern, unterstützt verschiedene Dialogszenarien mit hochwertigen Trainingsdaten, die auf menschliche Präferenzen abgestimmt sind."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Yi 1.5, das neueste Open-Source-Fine-Tuning-Modell mit 9 Milliarden Parametern, unterstützt verschiedene Dialogszenarien mit hochwertigen Trainingsdaten, die auf menschliche Präferenzen abgestimmt sind."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro ist ein wichtiger Bestandteil der 360 AI-Modellreihe und erfüllt mit seiner effizienten Textverarbeitungsfähigkeit vielfältige Anwendungen der natürlichen Sprache, unterstützt das Verständnis langer Texte und Mehrfachdialoge."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview ist ein forschungsorientiertes Modell, das vom Qwen-Team entwickelt wurde und sich auf visuelle Inferenzfähigkeiten konzentriert. Es hat einzigartige Vorteile beim Verständnis komplexer Szenen und der Lösung visuell verwandter mathematischer Probleme."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ ist das Inferenzmodell der Qwen-Serie. Im Vergleich zu traditionellen, anweisungsoptimierten Modellen verfügt QwQ über Denk- und Schlussfolgerungsfähigkeiten, die eine signifikante Leistungssteigerung bei nachgelagerten Aufgaben ermöglichen, insbesondere bei der Lösung schwieriger Probleme. QwQ-32B ist ein mittelgroßes Inferenzmodell, das im Vergleich zu den fortschrittlichsten Inferenzmodellen (wie DeepSeek-R1, o1-mini) wettbewerbsfähige Leistungen erzielt. Dieses Modell verwendet Technologien wie RoPE, SwiGLU, RMSNorm und Attention QKV Bias und hat eine Netzwerkstruktur mit 64 Schichten und 40 Q-Attention-Köpfen (im GQA-Architektur sind es 8 KV)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview ist das neueste experimentelle Forschungsmodell von Qwen, das sich auf die Verbesserung der KI-Inferenzfähigkeiten konzentriert. Durch die Erforschung komplexer Mechanismen wie Sprachmischung und rekursive Inferenz bietet es Hauptvorteile wie starke Analysefähigkeiten, mathematische und Programmierfähigkeiten. Gleichzeitig gibt es Herausforderungen wie Sprachwechsel, Inferenzzyklen, Sicherheitsüberlegungen und Unterschiede in anderen Fähigkeiten."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet setzt neue Maßstäbe in der Branche, übertrifft die Modelle der Konkurrenz und Claude 3 Opus, und zeigt in umfassenden Bewertungen hervorragende Leistungen, während es die Geschwindigkeit und Kosten unserer mittelgroßen Modelle beibehält."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet hebt den Branchenstandard an, übertrifft die Modelle der Konkurrenz und Claude 3 Opus, und zeigt in umfassenden Bewertungen hervorragende Leistungen, während es die Geschwindigkeit und Kosten unserer mittelgroßen Modelle beibehält."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku ist das schnellste und kompakteste Modell von Anthropic und bietet nahezu sofortige Reaktionsgeschwindigkeiten. Es kann schnell einfache Anfragen und Anforderungen beantworten. Kunden werden in der Lage sein, nahtlose AI-Erlebnisse zu schaffen, die menschliche Interaktionen nachahmen. Claude 3 Haiku kann Bilder verarbeiten und Textausgaben zurückgeben, mit einem Kontextfenster von 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 ist ein mehrsprachiges Modell von Cohere, das 23 Sprachen unterstützt und die Anwendung in einer Vielzahl von Sprachen erleichtert."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B ist ein Open-Source-Sprachmodell mit 13 Milliarden Parametern, das von Baichuan Intelligence entwickelt wurde und in autorisierten chinesischen und englischen Benchmarks die besten Ergebnisse in seiner Größenordnung erzielt hat."
+  },
  "charglm-3": {
    "description": "CharGLM-3 ist für Rollenspiele und emotionale Begleitung konzipiert und unterstützt extrem lange Mehrfachgedächtnisse und personalisierte Dialoge, mit breiter Anwendung."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 hat die Schlussfolgerungsfähigkeiten des Modells erheblich verbessert, selbst bei nur wenigen gekennzeichneten Daten. Bevor das Modell die endgültige Antwort ausgibt, gibt es zunächst eine Denkprozesskette aus, um die Genauigkeit der endgültigen Antwort zu erhöhen."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B ist ein großes Sprachmodell, das auf Llama3.3 70B basiert und durch Feinabstimmung mit den Ausgaben von DeepSeek R1 eine wettbewerbsfähige Leistung erreicht, die mit großen, fortschrittlichen Modellen vergleichbar ist."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B ist ein distilliertes großes Sprachmodell, das auf Llama-3.1-8B-Instruct basiert und durch Training mit den Ausgaben von DeepSeek R1 erstellt wurde."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B ist ein distilliertes großes Sprachmodell, das auf Qwen 2.5 14B basiert und durch Training mit den Ausgaben von DeepSeek R1 erstellt wurde. Dieses Modell hat in mehreren Benchmark-Tests OpenAI's o1-mini übertroffen und die neuesten technologischen Fortschritte bei dichten Modellen (state-of-the-art) erzielt. Hier sind einige Ergebnisse der Benchmark-Tests:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nDas Modell zeigt durch Feinabstimmung mit den Ausgaben von DeepSeek R1 eine wettbewerbsfähige Leistung, die mit größeren, fortschrittlichen Modellen vergleichbar ist."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B ist ein distilliertes großes Sprachmodell, das auf Qwen 2.5 32B basiert und durch Training mit den Ausgaben von DeepSeek R1 erstellt wurde. Dieses Modell hat in mehreren Benchmark-Tests OpenAI's o1-mini übertroffen und die neuesten technologischen Fortschritte bei dichten Modellen (state-of-the-art) erzielt. Hier sind einige Ergebnisse der Benchmark-Tests:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nDas Modell zeigt durch Feinabstimmung mit den Ausgaben von DeepSeek R1 eine wettbewerbsfähige Leistung, die mit größeren, fortschrittlichen Modellen vergleichbar ist."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 ist das neueste Open-Source-Modell, das vom DeepSeek-Team veröffentlicht wurde und über eine äußerst leistungsstarke Inferenzleistung verfügt, insbesondere in den Bereichen Mathematik, Programmierung und logisches Denken, die mit dem OpenAI o1-Modell vergleichbar ist."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 hat die Schlussfolgerungsfähigkeiten des Modells erheblich verbessert, selbst bei nur wenigen gekennzeichneten Daten. Bevor das Modell die endgültige Antwort ausgibt, gibt es zunächst eine Denkprozesskette aus, um die Genauigkeit der endgültigen Antwort zu erhöhen."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 hat einen bedeutenden Durchbruch in der Inferenzgeschwindigkeit im Vergleich zu früheren Modellen erzielt. Es belegt den ersten Platz unter den Open-Source-Modellen und kann mit den weltweit fortschrittlichsten proprietären Modellen konkurrieren. DeepSeek-V3 verwendet die Multi-Head-Latent-Attention (MLA) und die DeepSeekMoE-Architektur, die in DeepSeek-V2 umfassend validiert wurden. Darüber hinaus hat DeepSeek-V3 eine unterstützende verlustfreie Strategie für die Lastenverteilung eingeführt und mehrere Zielvorgaben für das Training von Mehrfachvorhersagen festgelegt, um eine stärkere Leistung zu erzielen."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 hat einen bedeutenden Durchbruch in der Inferenzgeschwindigkeit im Vergleich zu früheren Modellen erzielt. Es belegt den ersten Platz unter den Open-Source-Modellen und kann mit den weltweit fortschrittlichsten proprietären Modellen konkurrieren. DeepSeek-V3 verwendet die Multi-Head-Latent-Attention (MLA) und die DeepSeekMoE-Architektur, die in DeepSeek-V2 umfassend validiert wurden. Darüber hinaus hat DeepSeek-V3 eine unterstützende verlustfreie Strategie für die Lastenverteilung eingeführt und mehrere Zielvorgaben für das Training von Mehrfachvorhersagen festgelegt, um eine stärkere Leistung zu erzielen."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite ist das neueste leichte Modell der nächsten Generation, das eine extrem schnelle Reaktionszeit bietet und sowohl in der Leistung als auch in der Latenz weltweit erstklassig ist."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash bietet nächste Generation Funktionen und Verbesserungen, einschließlich außergewöhnlicher Geschwindigkeit, nativer Werkzeugnutzung, multimodaler Generierung und einem Kontextfenster von 1M Tokens."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash ist eine Modellvariante, die auf Kosteneffizienz und niedrige Latenz optimiert ist."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash ist eine Modellvariante, die auf Kosteneffizienz und niedrige Latenz optimiert ist."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Ein Gemini 2.0 Flash Modell, das auf Kosteneffizienz und niedrige Latenz optimiert wurde."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp ist Googles neuestes experimentelles multimodales KI-Modell mit der nächsten Generation von Funktionen, außergewöhnlicher Geschwindigkeit, nativer Tool-Nutzung und multimodaler Generierung."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp ist Googles neuestes experimentelles multimodales KI-Modell mit der nächsten Generation von Funktionen, außergewöhnlicher Geschwindigkeit, nativer Tool-Nutzung und multimodaler Generierung."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "Das neueste GPT-4 Turbo-Modell verfügt über visuelle Funktionen. Jetzt können visuelle Anfragen im JSON-Format und durch Funktionsaufrufe gestellt werden. GPT-4 Turbo ist eine verbesserte Version, die kosteneffiziente Unterstützung für multimodale Aufgaben bietet. Es findet ein Gleichgewicht zwischen Genauigkeit und Effizienz und eignet sich für Anwendungen, die Echtzeitanpassungen erfordern."
  },
+  "gpt-4.5-preview": {
+    "description": "Die Forschungs-Vorschau von GPT-4.5, unserem bisher größten und leistungsstärksten GPT-Modell. Es verfügt über umfangreiches Weltwissen und kann die Absichten der Benutzer besser verstehen, was es in kreativen Aufgaben und autonomer Planung herausragend macht. GPT-4.5 akzeptiert Text- und Bild-Eingaben und generiert Textausgaben (einschließlich strukturierter Ausgaben). Es unterstützt wichtige Entwicklerfunktionen wie Funktionsaufrufe, Batch-APIs und Streaming-Ausgaben. In Aufgaben, die kreatives, offenes Denken und Dialog erfordern (wie Schreiben, Lernen oder das Erkunden neuer Ideen), zeigt GPT-4.5 besonders gute Leistungen. Der Wissensstand ist bis Oktober 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o ist ein dynamisches Modell, das in Echtzeit aktualisiert wird, um die neueste Version zu gewährleisten. Es kombiniert starke Sprachverständnis- und Generierungsfähigkeiten und eignet sich für großangelegte Anwendungsszenarien, einschließlich Kundenservice, Bildung und technische Unterstützung."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B ist ein leistungsstarkes Modell, das schnelle Textgenerierungsfähigkeiten bietet und sich hervorragend für Anwendungen eignet, die große Effizienz und Kosteneffektivität erfordern."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Das Llama 3.1 Sonar Huge Online-Modell hat 405B Parameter und unterstützt eine Kontextlänge von etwa 127.000 Markierungen, es wurde für komplexe Online-Chat-Anwendungen entwickelt."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Das Llama 3.1 Sonar Large Online-Modell hat 70B Parameter und unterstützt eine Kontextlänge von etwa 127.000 Markierungen, es eignet sich für hochvolumige und vielfältige Chat-Aufgaben."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Das Llama 3.1 Sonar Small Online-Modell hat 8B Parameter und unterstützt eine Kontextlänge von etwa 127.000 Markierungen, es wurde speziell für Online-Chat entwickelt und kann verschiedene Textinteraktionen effizient verarbeiten."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Überlegene Bildverarbeitungsfähigkeiten auf hochauflösenden Bildern, geeignet für visuelle Verständnisanwendungen."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 ist darauf ausgelegt, Aufgaben zu bearbeiten, die visuelle und textuelle Daten kombinieren. Es zeigt hervorragende Leistungen bei Aufgaben wie Bildbeschreibung und visuellem Fragen und Antworten und überbrückt die Kluft zwischen Sprachgenerierung und visueller Schlussfolgerung."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 ist darauf ausgelegt, Aufgaben zu bearbeiten, die visuelle und textuelle Daten kombinieren. Es zeigt hervorragende Leistungen bei Aufgaben wie Bildbeschreibung und visuellem Fragen und Antworten und überbrückt die Kluft zwischen Sprachgenerierung und visueller Schlussfolgerung."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Der Tongyi Qianwen ist ein Sprachmodell mit einem Umfang von mehreren Billionen, das Eingaben in verschiedenen Sprachen wie Chinesisch und Englisch unterstützt und die API-Modelle hinter der aktuellen Version 2.5 von Tongyi Qianwen darstellt."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "Die Qwen-Omni-Serie unterstützt die Eingabe von Daten in verschiedenen Modalitäten, einschließlich Video, Audio, Bilder und Text, und gibt Audio und Text aus."
+  },
  "qwen-plus": {
    "description": "Qwen Plus ist die verbesserte Version des großangelegten Sprachmodells, das Eingaben in verschiedenen Sprachen wie Chinesisch und Englisch unterstützt."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Initiiert mit dem Qwen-7B-Sprachmodell, fügt es ein Bildmodell hinzu, das für Bildeingaben mit einer Auflösung von 448 vortrainiert wurde."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 ist die brandneue Serie von großen Sprachmodellen von Qwen. Qwen2 7B ist ein transformerbasiertes Modell, das in den Bereichen Sprachverständnis, Mehrsprachigkeit, Programmierung, Mathematik und logisches Denken hervorragende Leistungen zeigt."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 ist eine neue Serie großer Sprachmodelle mit stärkeren Verständnis- und Generierungsfähigkeiten."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL ist die neueste Iteration des Qwen-VL-Modells und hat in Benchmark-Tests zur visuellen Verständlichkeit eine fortschrittliche Leistung erreicht, einschließlich MathVista, DocVQA, RealWorldQA und MTVQA. Qwen2-VL kann über 20 Minuten Video verstehen und ermöglicht qualitativ hochwertige, videobasierte Fragen und Antworten, Dialoge und Inhaltserstellung. Es verfügt auch über komplexe Denk- und Entscheidungsfähigkeiten und kann mit mobilen Geräten, Robotern usw. integriert werden, um basierend auf visuellen Umgebungen und Textanweisungen automatisch zu agieren. Neben Englisch und Chinesisch unterstützt Qwen2-VL jetzt auch das Verständnis von Text in Bildern in verschiedenen Sprachen, einschließlich der meisten europäischen Sprachen, Japanisch, Koreanisch, Arabisch und Vietnamesisch."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct ist eines der neuesten großen Sprachmodell-Serien, die von Alibaba Cloud veröffentlicht wurden. Dieses 72B-Modell hat signifikante Verbesserungen in den Bereichen Codierung und Mathematik. Das Modell bietet auch mehrsprachige Unterstützung und deckt über 29 Sprachen ab, einschließlich Chinesisch und Englisch. Das Modell hat signifikante Verbesserungen in der Befolgung von Anweisungen, im Verständnis von strukturierten Daten und in der Generierung von strukturierten Ausgaben (insbesondere JSON) erzielt."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct ist eines der neuesten großen Sprachmodell-Serien, die von Alibaba Cloud veröffentlicht wurden. Dieses 32B-Modell hat signifikante Verbesserungen in den Bereichen Codierung und Mathematik. Das Modell bietet auch mehrsprachige Unterstützung und deckt über 29 Sprachen ab, einschließlich Chinesisch und Englisch. Das Modell hat signifikante Verbesserungen in der Befolgung von Anweisungen, im Verständnis von strukturierten Daten und in der Generierung von strukturierten Ausgaben (insbesondere JSON) erzielt."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM, das auf Chinesisch und Englisch ausgerichtet ist und sich auf Sprache, Programmierung, Mathematik, Schlussfolgern und andere Bereiche konzentriert."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ ist ein experimentelles Forschungsmodell, das sich auf die Verbesserung der KI-Inferenzfähigkeiten konzentriert."
  },
+  "qwq-32b": {
+    "description": "Das QwQ-Inferenzmodell, das auf dem Qwen2.5-32B-Modell trainiert wurde, hat durch verstärktes Lernen die Inferenzfähigkeiten des Modells erheblich verbessert. Die Kernmetriken des Modells, wie mathematische Codes (AIME 24/25, LiveCodeBench) sowie einige allgemeine Metriken (IFEval, LiveBench usw.), erreichen das Niveau der DeepSeek-R1 Vollversion, wobei alle Metriken deutlich die ebenfalls auf Qwen2.5-32B basierende DeepSeek-R1-Distill-Qwen-32B übertreffen."
+  },
  "qwq-32b-preview": {
    "description": "Das QwQ-Modell ist ein experimentelles Forschungsmodell, das vom Qwen-Team entwickelt wurde und sich auf die Verbesserung der KI-Inferenzfähigkeiten konzentriert."
  },
+  "qwq-plus-latest": {
+    "description": "Das QwQ-Inferenzmodell, das auf dem Qwen2.5-Modell trainiert wurde, hat durch verstärktes Lernen die Inferenzfähigkeiten des Modells erheblich verbessert. Die Kernmetriken des Modells, wie mathematische Codes (AIME 24/25, LiveCodeBench) sowie einige allgemeine Metriken (IFEval, LiveBench usw.), erreichen das Niveau der DeepSeek-R1 Vollversion."
+  },
+  "r1-1776": {
+    "description": "R1-1776 ist eine Version des DeepSeek R1 Modells, die nachtrainiert wurde, um unverfälschte, unvoreingenommene Fakteninformationen bereitzustellen."
+  },
  "solar-mini": {
    "description": "Solar Mini ist ein kompaktes LLM, das besser abschneidet als GPT-3.5 und über starke Mehrsprachigkeitsfähigkeiten verfügt. Es unterstützt Englisch und Koreanisch und bietet eine effiziente und kompakte Lösung."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Ein leichtgewichtiges Suchprodukt, das auf kontextbezogener Suche basiert und schneller und günstiger ist als Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research führt umfassende Expertenforschung durch und fasst diese in zugänglichen, umsetzbaren Berichten zusammen."
+  },
  "sonar-pro": {
    "description": "Ein fortschrittliches Suchprodukt, das kontextbezogene Suche unterstützt und erweiterte Abfragen sowie Nachverfolgung ermöglicht."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Effizientes und kostengünstiges neues Embedding-Modell, geeignet für Wissensabruf, RAG-Anwendungen und andere Szenarien."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "Die Open-Source-Version des neuesten vortrainierten Modells der GLM-4-Serie, das von Zhizhu AI veröffentlicht wurde."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) bietet durch effiziente Strategien und Modellarchitekturen verbesserte Rechenfähigkeiten."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet hebt den Branchenstandard an, übertrifft die Konkurrenzmodelle und Claude 3 Opus und zeigt in umfangreichen Bewertungen hervorragende Leistungen, während es die Geschwindigkeit und Kosten unserer mittelgroßen Modelle beibehält."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 Sonett ist das schnellste nächste Modell von Anthropic. Im Vergleich zu Claude 3 Haiku hat Claude 3.7 Sonett in allen Fähigkeiten Verbesserungen erfahren und übertrifft in vielen intellektuellen Benchmark-Tests das größte Modell der vorherigen Generation, Claude 3 Opus."
+  },
  "whisper-1": {
    "description": "Allgemeines Spracherkennungsmodell, unterstützt mehrsprachige Spracherkennung, Sprachübersetzung und Spracherkennung."
  },
@@ -140,6 +140,18 @@
      "close": "Löschen",
      "confirm": "Konfiguration abgeschlossen und erneut versucht"
    },
+    "crawPages": {
+      "crawling": "Linkerkennung läuft",
+      "detail": {
+        "preview": "Vorschau",
+        "raw": "Ursprünglicher Text",
+        "tooLong": "Der Textinhalt ist zu lang, der Kontext des Gesprächs behält nur die ersten {{characters}} Zeichen bei, der übersteigende Teil wird nicht in den Gesprächskontext einbezogen."
+      },
+      "meta": {
+        "crawler": "Crawler-Modus",
+        "words": "Zeichenanzahl"
+      }
+    },
    "searchxng": {
      "baseURL": "Bitte eingeben",
      "description": "Geben Sie die URL von SearchXNG ein, um mit der Online-Suche zu beginnen",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity ist ein führender Anbieter von Dialoggenerierungsmodellen und bietet eine Vielzahl fortschrittlicher Llama 3.1-Modelle an, die sowohl für Online- als auch Offline-Anwendungen geeignet sind und sich besonders für komplexe Aufgaben der Verarbeitung natürlicher Sprache eignen."
  },
+  "ppio": {
+    "description": "PPIO Paiou Cloud bietet stabile und kosteneffiziente Open-Source-Modell-API-Dienste und unterstützt die gesamte DeepSeek-Serie, Llama, Qwen und andere führende große Modelle der Branche."
+  },
  "qwen": {
    "description": "Tongyi Qianwen ist ein von Alibaba Cloud selbst entwickeltes, groß angelegtes Sprachmodell mit starken Fähigkeiten zur Verarbeitung und Generierung natürlicher Sprache. Es kann eine Vielzahl von Fragen beantworten, Texte erstellen, Meinungen äußern und Code schreiben und spielt in mehreren Bereichen eine Rolle."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Copy",
  "emptyAgent": "No assistant available",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "The cost of generating a single conversation can be reduced by up to 90%, and the response speed is increased by 4 times (<1>Learn more</1>). Enabling this will automatically disable the limit on the number of historical messages.",
+      "title": "Enable Context Caching"
+    },
    "enableReasoning": {
+      "desc": "Based on the Claude Thinking mechanism limit (<1>Learn more</1>), enabling this will automatically disable the limit on the number of historical messages.",
      "title": "Enable Deep Thinking"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Model Extension Features"
  },
+  "history": {
+    "title": "The assistant will only remember the last {{count}} messages."
+  },
  "historyRange": "History Range",
  "historySummary": "Historical Message Summary",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "There are subtopics, deletion is not allowed",
    "regenerate": "Regenerate"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Credits",
+      "creditPricing": "Pricing",
+      "creditTooltip": "For counting purposes, we convert $1 to 1M credits; for example, $3/M tokens can be converted to 3 credits/token.",
+      "pricing": {
+        "inputCachedTokens": "Cached input {{amount}}/credits · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M characters",
+        "inputMinutes": "${{amount}}/minute",
+        "inputTokens": "Input {{amount}}/credits · ${{amount}}/M",
+        "outputTokens": "Output {{amount}}/credits · ${{amount}}/M",
+        "writeCacheInputTokens": "Cache input write {{amount}}/points · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Average unit price",
+      "input": "Input",
+      "inputAudio": "Audio Input",
+      "inputCached": "Cached Input",
+      "inputCitation": "Input citation",
+      "inputText": "Text Input",
+      "inputTitle": "Input Details",
+      "inputUncached": "Uncached Input",
+      "inputWriteCached": "Input cache write",
+      "output": "Output",
+      "outputAudio": "Audio Output",
+      "outputText": "Text Output",
+      "outputTitle": "Output Details",
+      "reasoning": "Deep Thinking",
+      "title": "Generation Details",
+      "total": "Total Consumption"
+    }
+  },
  "newAgent": "New Assistant",
  "pin": "Pin",
  "pinOff": "Unpin",
@@ -322,6 +322,9 @@
    "tooltip": "Update provider basic configuration",
    "updateSuccess": "Update successful"
  },
+  "updateCustomAiProvider": {
+    "title": "Update Custom AI Provider Configuration"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Enter your Vertex AI Keys",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B supports 16K tokens, providing efficient and smooth language generation capabilities."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything, the latest open-source fine-tuned model with 34 billion parameters, supports various dialogue scenarios with high-quality training data aligned with human preferences."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything, the latest open-source fine-tuned model with 9 billion parameters, supports various dialogue scenarios with high-quality training data aligned with human preferences."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, as an important member of the 360 AI model series, meets diverse natural language application scenarios with efficient text processing capabilities, supporting long text understanding and multi-turn dialogue."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview is a research-oriented model developed by the Qwen team, focusing on visual reasoning capabilities, with unique advantages in understanding complex scenes and solving visually related mathematical problems."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ is the inference model of the Qwen series. Compared to traditional instruction-tuned models, QwQ possesses reasoning and cognitive abilities, achieving significantly enhanced performance in downstream tasks, especially in solving difficult problems. QwQ-32B is a medium-sized inference model that competes effectively against state-of-the-art inference models (such as DeepSeek-R1 and o1-mini). This model employs technologies such as RoPE, SwiGLU, RMSNorm, and Attention QKV bias, featuring a 64-layer network structure and 40 Q attention heads (with 8 KV heads in the GQA architecture)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview is Qwen's latest experimental research model, focusing on enhancing AI reasoning capabilities. By exploring complex mechanisms such as language mixing and recursive reasoning, its main advantages include strong analytical reasoning, mathematical, and programming abilities. However, it also faces challenges such as language switching issues, reasoning loops, safety considerations, and differences in other capabilities."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet raises the industry standard, outperforming competing models and Claude 3 Opus, excelling in extensive evaluations while maintaining the speed and cost of our mid-tier models."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet is Anthropic's latest model, offering a balance of speed and performance. It excels in a wide range of tasks, including programming, data science, visual processing, and agent tasks."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku is Anthropic's fastest and most compact model, providing near-instantaneous response times. It can quickly answer simple queries and requests. Customers will be able to build seamless AI experiences that mimic human interaction. Claude 3 Haiku can process images and return text output, with a context window of 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 is a multilingual model launched by Cohere, supporting 23 languages, facilitating diverse language applications."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B is an open-source, commercially usable large language model developed by Baichuan Intelligence, containing 13 billion parameters, achieving the best results in its size on authoritative Chinese and English benchmarks."
+  },
  "charglm-3": {
    "description": "CharGLM-3 is designed for role-playing and emotional companionship, supporting ultra-long multi-turn memory and personalized dialogue, with wide applications."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 significantly enhances model reasoning capabilities with minimal labeled data. Before outputting the final answer, the model first provides a chain of thought to improve the accuracy of the final response."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B is a large language model based on Llama3.3 70B, which achieves competitive performance comparable to large cutting-edge models by utilizing fine-tuning from DeepSeek R1 outputs."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B is a distilled large language model based on Llama-3.1-8B-Instruct, trained using outputs from DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B is a distilled large language model based on Qwen 2.5 14B, trained using outputs from DeepSeek R1. This model has surpassed OpenAI's o1-mini in several benchmark tests, achieving state-of-the-art results for dense models. Here are some benchmark results:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nThis model demonstrates competitive performance comparable to larger cutting-edge models through fine-tuning from DeepSeek R1 outputs."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B is a distilled large language model based on Qwen 2.5 32B, trained using outputs from DeepSeek R1. This model has surpassed OpenAI's o1-mini in several benchmark tests, achieving state-of-the-art results for dense models. Here are some benchmark results:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nThis model demonstrates competitive performance comparable to larger cutting-edge models through fine-tuning from DeepSeek R1 outputs."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 is the latest open-source model released by the DeepSeek team, featuring impressive inference performance, particularly in mathematics, programming, and reasoning tasks, reaching levels comparable to OpenAI's o1 model."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 significantly enhances model reasoning capabilities with minimal labeled data. Before outputting the final answer, the model first provides a chain of thought to improve the accuracy of the final response."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 has achieved a significant breakthrough in inference speed compared to previous models. It ranks first among open-source models and can compete with the world's most advanced closed-source models. DeepSeek-V3 employs Multi-Head Latent Attention (MLA) and DeepSeekMoE architectures, which have been thoroughly validated in DeepSeek-V2. Additionally, DeepSeek-V3 introduces an auxiliary lossless strategy for load balancing and sets multi-label prediction training objectives for enhanced performance."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 has achieved a significant breakthrough in inference speed compared to previous models. It ranks first among open-source models and can compete with the world's most advanced closed-source models. DeepSeek-V3 employs Multi-Head Latent Attention (MLA) and DeepSeekMoE architectures, which have been thoroughly validated in DeepSeek-V2. Additionally, DeepSeek-V3 introduces an auxiliary lossless strategy for load balancing and sets multi-label prediction training objectives for enhanced performance."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite is a new generation lightweight model, offering extreme response speed with performance and latency at a world-class level."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash offers next-generation features and improvements, including exceptional speed, native tool usage, multimodal generation, and a 1M token context window."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash is a variant of the model optimized for cost-effectiveness and low latency."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash is a variant of the model optimized for cost-effectiveness and low latency."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "A Gemini 2.0 Flash model optimized for cost-effectiveness and low latency."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp is Google's latest experimental multimodal AI model, featuring next-generation capabilities, exceptional speed, native tool invocation, and multimodal generation."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp is Google's latest experimental multimodal AI model, featuring next-generation capabilities, exceptional speed, native tool invocation, and multimodal generation."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "The latest GPT-4 Turbo model features visual capabilities. Now, visual requests can be made using JSON format and function calls. GPT-4 Turbo is an enhanced version that provides cost-effective support for multimodal tasks. It strikes a balance between accuracy and efficiency, making it suitable for applications requiring real-time interaction."
  },
+  "gpt-4.5-preview": {
+    "description": "The research preview of GPT-4.5, our largest and most powerful GPT model to date. It possesses extensive world knowledge and better understands user intent, excelling in creative tasks and autonomous planning. GPT-4.5 accepts both text and image inputs and generates text outputs (including structured outputs). It supports key developer features such as function calling, batch API, and streaming output. GPT-4.5 particularly shines in tasks that require creativity, open-ended thinking, and dialogue, such as writing, learning, or exploring new ideas. Knowledge cutoff date is October 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o is a dynamic model that updates in real-time to stay current with the latest version. It combines powerful language understanding and generation capabilities, making it suitable for large-scale applications, including customer service, education, and technical support."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B is a high-performance model that offers rapid text generation capabilities, making it ideal for applications requiring large-scale efficiency and cost-effectiveness."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Llama 3.1 Sonar Huge Online model, featuring 405B parameters, supports a context length of approximately 127,000 tokens, designed for complex online chat applications."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Llama 3.1 Sonar Large Online model, featuring 70B parameters, supports a context length of approximately 127,000 tokens, suitable for high-capacity and diverse chat tasks."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Llama 3.1 Sonar Small Online model, featuring 8B parameters, supports a context length of approximately 127,000 tokens, designed for online chat, efficiently handling various text interactions."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Excellent image reasoning capabilities on high-resolution images, suitable for visual understanding applications."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 is designed to handle tasks that combine visual and textual data. It excels in tasks such as image description and visual question answering, bridging the gap between language generation and visual reasoning."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 is designed to handle tasks that combine visual and textual data. It excels in tasks such as image description and visual question answering, bridging the gap between language generation and visual reasoning."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Tongyi Qianwen Max is a large-scale language model with hundreds of billions of parameters, supporting input in various languages, including Chinese and English. It is the API model behind the current Tongyi Qianwen 2.5 product version."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "The Qwen-Omni series of models supports input of various modalities, including video, audio, images, and text, and outputs both audio and text."
+  },
  "qwen-plus": {
    "description": "Qwen Plus is an enhanced large-scale language model supporting input in various languages including Chinese and English."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Initialized with the Qwen-7B language model, this pre-trained model adds an image model with an input resolution of 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 is a brand new series of large language models. Qwen2 7B is a transformer-based model that excels in language understanding, multilingual capabilities, programming, mathematics, and reasoning."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 is a brand new series of large language models with enhanced understanding and generation capabilities."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL is the latest iteration of the Qwen-VL model, achieving state-of-the-art performance in visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, and MTVQA. Qwen2-VL can understand videos over 20 minutes long for high-quality video-based Q&A, dialogue, and content creation. It also possesses complex reasoning and decision-making capabilities, allowing integration with mobile devices, robots, and more for automated operations based on visual environments and text instructions. In addition to English and Chinese, Qwen2-VL now supports understanding text in different languages within images, including most European languages, Japanese, Korean, Arabic, and Vietnamese."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct is one of the latest large language model series released by Alibaba Cloud. This 72B model has significantly improved capabilities in coding and mathematics. The model also offers multilingual support, covering over 29 languages, including Chinese and English. It shows significant enhancements in instruction following, understanding structured data, and generating structured outputs (especially JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct is one of the latest large language model series released by Alibaba Cloud. This 32B model has significantly improved capabilities in coding and mathematics. The model provides multilingual support, covering over 29 languages, including Chinese and English. It shows significant enhancements in instruction following, understanding structured data, and generating structured outputs (especially JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "An LLM focused on both Chinese and English, targeting language, programming, mathematics, reasoning, and more."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ is an experimental research model focused on improving AI reasoning capabilities."
  },
+  "qwq-32b": {
+    "description": "The QwQ inference model is trained based on the Qwen2.5-32B model, significantly enhancing its reasoning capabilities through reinforcement learning. The core metrics of the model, including mathematical code (AIME 24/25, LiveCodeBench) and some general metrics (IFEval, LiveBench, etc.), reach the level of the full version of DeepSeek-R1, with all metrics significantly surpassing those of DeepSeek-R1-Distill-Qwen-32B, which is also based on Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "The QwQ model is an experimental research model developed by the Qwen team, focusing on enhancing AI reasoning capabilities."
  },
+  "qwq-plus-latest": {
+    "description": "The QwQ inference model is trained based on the Qwen2.5 model, significantly enhancing its reasoning capabilities through reinforcement learning. The core metrics of the model, including mathematical code (AIME 24/25, LiveCodeBench) and some general metrics (IFEval, LiveBench, etc.), reach the level of the full version of DeepSeek-R1."
+  },
+  "r1-1776": {
+    "description": "R1-1776 is a version of the DeepSeek R1 model, fine-tuned to provide unfiltered, unbiased factual information."
+  },
  "solar-mini": {
    "description": "Solar Mini is a compact LLM that outperforms GPT-3.5, featuring strong multilingual capabilities and supporting English and Korean, providing an efficient and compact solution."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "A lightweight search product based on contextual search, faster and cheaper than Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research conducts comprehensive expert-level studies and synthesizes them into accessible, actionable reports."
+  },
  "sonar-pro": {
    "description": "An advanced search product that supports contextual search, advanced queries, and follow-ups."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "An efficient and cost-effective next-generation embedding model, suitable for knowledge retrieval, RAG applications, and more."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "The open-source version of the latest generation pre-trained model from the GLM-4 series released by Zhiyuan AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) provides enhanced computational capabilities through efficient strategies and model architecture."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet raises the industry standard, outperforming competitor models and Claude 3 Opus, excelling in a wide range of evaluations while maintaining the speed and cost of our mid-tier models."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 Sonnet is Anthropic's fastest next-generation model. Compared to Claude 3 Haiku, Claude 3.7 Sonnet shows improvements across various skills and surpasses the previous generation's largest model, Claude 3 Opus, in many intelligence benchmark tests."
+  },
  "whisper-1": {
    "description": "A universal speech recognition model that supports multilingual speech recognition, speech translation, and language identification."
  },
@@ -140,6 +140,18 @@
      "close": "Delete",
      "confirm": "Configuration completed, please retry"
    },
+    "crawPages": {
+      "crawling": "Identifying links",
+      "detail": {
+        "preview": "Preview",
+        "raw": "Raw text",
+        "tooLong": "The text content is too long; only the first {{characters}} characters of the conversation context will be retained, and the excess will not be included in the conversation context."
+      },
+      "meta": {
+        "crawler": "Crawling Mode",
+        "words": "Character count"
+      }
+    },
    "searchxng": {
      "baseURL": "Please enter",
      "description": "Enter the URL for SearchXNG to start online searching",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity is a leading provider of conversational generation models, offering various advanced Llama 3.1 models that support both online and offline applications, particularly suited for complex natural language processing tasks."
  },
+  "ppio": {
+    "description": "PPIO supports stable and cost-efficient open-source LLM APIs, such as DeepSeek, Llama, Qwen etc."
+  },
  "qwen": {
    "description": "Tongyi Qianwen is a large-scale language model independently developed by Alibaba Cloud, featuring strong natural language understanding and generation capabilities. It can answer various questions, create written content, express opinions, and write code, playing a role in multiple fields."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Copia",
  "emptyAgent": "No hay asistente disponible",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "El costo de generación de una sola conversación puede reducirse hasta en un 90%, y la velocidad de respuesta se incrementa 4 veces (<1>Más información</1>). Al activarlo, se desactivará automáticamente el límite de mensajes históricos",
+      "title": "Activar caché de contexto"
+    },
    "enableReasoning": {
+      "desc": "Basado en las restricciones del mecanismo Claude Thinking (<1>Más información</1>), al activarlo se desactivará automáticamente el límite de mensajes históricos",
      "title": "Activar el pensamiento profundo"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Funcionalidad de extensión del modelo"
  },
+  "history": {
+    "title": "El asistente solo recordará los últimos {{count}} mensajes"
+  },
  "historyRange": "Rango de historial",
  "historySummary": "Resumen de mensajes históricos",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Existen subtemas, no se puede eliminar",
    "regenerate": "Regenerar"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Créditos",
+      "creditPricing": "Precios",
+      "creditTooltip": "Para facilitar el conteo, convertimos 1$ en 1M créditos, por ejemplo, $3/M tokens se convierte en 3 créditos/token",
+      "pricing": {
+        "inputCachedTokens": "Entradas en caché {{amount}}/créditos · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M caracteres",
+        "inputMinutes": "${{amount}}/minuto",
+        "inputTokens": "Entradas {{amount}}/créditos · ${{amount}}/M",
+        "outputTokens": "Salidas {{amount}}/créditos · ${{amount}}/M",
+        "writeCacheInputTokens": "Escritura en caché de entrada {{amount}}/puntos · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Precio promedio",
+      "input": "Entrada",
+      "inputAudio": "Entrada de audio",
+      "inputCached": "Entrada en caché",
+      "inputCitation": "Citación de entrada",
+      "inputText": "Entrada de texto",
+      "inputTitle": "Detalles de entrada",
+      "inputUncached": "Entrada no en caché",
+      "inputWriteCached": "Escritura en caché de entrada",
+      "output": "Salida",
+      "outputAudio": "Salida de audio",
+      "outputText": "Salida de texto",
+      "outputTitle": "Detalles de salida",
+      "reasoning": "Razonamiento profundo",
+      "title": "Detalles de generación",
+      "total": "Total consumido"
+    }
+  },
  "newAgent": "Nuevo asistente",
  "pin": "Fijar",
  "pinOff": "Desfijar",
@@ -322,6 +322,9 @@
    "tooltip": "Actualizar configuración básica del proveedor",
    "updateSuccess": "Actualización exitosa"
  },
+  "updateCustomAiProvider": {
+    "title": "Actualizar la configuración del proveedor de IA personalizado"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Introduce tus claves de Vertex AI",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B soporta 16K Tokens, proporcionando una capacidad de generación de lenguaje eficiente y fluida."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Cero Uno, el último modelo de ajuste fino de código abierto, cuenta con 34 mil millones de parámetros, con ajuste fino que admite múltiples escenarios de conversación y datos de entrenamiento de alta calidad, alineados con las preferencias humanas."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Cero Uno, el último modelo de ajuste fino de código abierto, cuenta con 9 mil millones de parámetros, con ajuste fino que admite múltiples escenarios de conversación y datos de entrenamiento de alta calidad, alineados con las preferencias humanas."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, como un miembro importante de la serie de modelos de IA de 360, satisface diversas aplicaciones de procesamiento de lenguaje natural con su eficiente capacidad de manejo de textos, soportando la comprensión de textos largos y funciones de diálogo en múltiples turnos."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview es un modelo de investigación desarrollado por el equipo de Qwen, enfocado en la capacidad de razonamiento visual, que tiene ventajas únicas en la comprensión de escenas complejas y en la resolución de problemas matemáticos relacionados con la visión."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ es el modelo de inferencia de la serie Qwen. A diferencia de los modelos tradicionales de ajuste por instrucciones, QwQ posee habilidades de pensamiento e inferencia, lo que le permite lograr un rendimiento significativamente mejorado en tareas posteriores, especialmente en la resolución de problemas difíciles. QwQ-32B es un modelo de inferencia de tamaño mediano que puede competir en rendimiento con los modelos de inferencia más avanzados (como DeepSeek-R1, o1-mini). Este modelo utiliza tecnologías como RoPE, SwiGLU, RMSNorm y sesgo de atención QKV, y cuenta con una estructura de red de 64 capas y 40 cabezas de atención Q (en la arquitectura GQA, KV es de 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview es el último modelo de investigación experimental de Qwen, enfocado en mejorar la capacidad de razonamiento de la IA. A través de la exploración de mecanismos complejos como la mezcla de lenguajes y el razonamiento recursivo, sus principales ventajas incluyen una poderosa capacidad de análisis de razonamiento, así como habilidades matemáticas y de programación. Sin embargo, también presenta problemas de cambio de idioma, ciclos de razonamiento, consideraciones de seguridad y diferencias en otras capacidades."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet ha elevado los estándares de la industria, superando el rendimiento de modelos competidores y de Claude 3 Opus, destacándose en evaluaciones amplias, mientras mantiene la velocidad y el costo de nuestros modelos de nivel medio."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet es el modelo de IA más potente de Anthropic, con un rendimiento de vanguardia en tareas altamente complejas. Puede manejar indicaciones abiertas y escenarios no vistos, con una fluidez y comprensión humana excepcionales. Claude 3.7 Sonnet muestra la vanguardia de las posibilidades de la IA generativa. Claude 3.7 Sonnet puede manejar imágenes y devolver salidas de texto, con una ventana de contexto de 200K."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku es el modelo más rápido y compacto de Anthropic, ofreciendo una velocidad de respuesta casi instantánea. Puede responder rápidamente a consultas y solicitudes simples. Los clientes podrán construir experiencias de IA sin costuras que imiten la interacción humana. Claude 3 Haiku puede manejar imágenes y devolver salidas de texto, con una ventana de contexto de 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 es un modelo multilingüe lanzado por Cohere, que admite 23 idiomas, facilitando aplicaciones de lenguaje diversas."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B es un modelo de lenguaje de gran escala de código abierto y comercializable desarrollado por Baichuan Intelligence, que cuenta con 13 mil millones de parámetros y ha logrado los mejores resultados en benchmarks autorizados en chino e inglés."
+  },
  "charglm-3": {
    "description": "CharGLM-3 está diseñado para juegos de rol y acompañamiento emocional, soportando memoria de múltiples rondas y diálogos personalizados, con aplicaciones amplias."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 mejora significativamente la capacidad de razonamiento del modelo con muy pocos datos etiquetados. Antes de proporcionar la respuesta final, el modelo genera una cadena de pensamiento para mejorar la precisión de la respuesta final."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B es un modelo de lenguaje de gran tamaño basado en Llama3.3 70B, que utiliza el ajuste fino de la salida de DeepSeek R1 para lograr un rendimiento competitivo comparable a los modelos de vanguardia de gran tamaño."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B es un modelo de lenguaje grande destilado basado en Llama-3.1-8B-Instruct, entrenado utilizando la salida de DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B es un modelo de lenguaje grande destilado basado en Qwen 2.5 14B, entrenado utilizando la salida de DeepSeek R1. Este modelo ha superado a o1-mini de OpenAI en múltiples pruebas de referencia, logrando resultados de vanguardia en modelos densos. A continuación se presentan algunos resultados de las pruebas de referencia:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCalificación de CodeForces: 1481\nEste modelo, ajustado a partir de la salida de DeepSeek R1, muestra un rendimiento competitivo comparable al de modelos de vanguardia de mayor escala."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B es un modelo de lenguaje grande destilado basado en Qwen 2.5 32B, entrenado utilizando la salida de DeepSeek R1. Este modelo ha superado a o1-mini de OpenAI en múltiples pruebas de referencia, logrando resultados de vanguardia en modelos densos. A continuación se presentan algunos resultados de las pruebas de referencia:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCalificación de CodeForces: 1691\nEste modelo, ajustado a partir de la salida de DeepSeek R1, muestra un rendimiento competitivo comparable al de modelos de vanguardia de mayor escala."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 es el último modelo de código abierto lanzado por el equipo de DeepSeek, que cuenta con un rendimiento de inferencia excepcional, especialmente en tareas de matemáticas, programación y razonamiento, alcanzando niveles comparables al modelo o1 de OpenAI."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 mejora significativamente la capacidad de razonamiento del modelo con muy pocos datos etiquetados. Antes de proporcionar la respuesta final, el modelo genera una cadena de pensamiento para mejorar la precisión de la respuesta final."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 ha logrado un avance significativo en la velocidad de inferencia en comparación con modelos anteriores. Se clasifica como el número uno entre los modelos de código abierto y puede competir con los modelos cerrados más avanzados del mundo. DeepSeek-V3 utiliza la arquitectura de atención multi-cabeza (MLA) y DeepSeekMoE, que han sido completamente validadas en DeepSeek-V2. Además, DeepSeek-V3 ha introducido una estrategia auxiliar sin pérdidas para el balanceo de carga y ha establecido objetivos de entrenamiento de predicción de múltiples etiquetas para lograr un rendimiento más robusto."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 ha logrado un avance significativo en la velocidad de inferencia en comparación con modelos anteriores. Se clasifica como el número uno entre los modelos de código abierto y puede competir con los modelos cerrados más avanzados del mundo. DeepSeek-V3 utiliza la arquitectura de atención multi-cabeza (MLA) y DeepSeekMoE, que han sido completamente validadas en DeepSeek-V2. Además, DeepSeek-V3 ha introducido una estrategia auxiliar sin pérdidas para el balanceo de carga y ha establecido objetivos de entrenamiento de predicción de múltiples etiquetas para lograr un rendimiento más robusto."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite es un modelo ligero de nueva generación, con una velocidad de respuesta extrema, alcanzando niveles de rendimiento y latencia de clase mundial."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash ofrece funciones y mejoras de próxima generación, incluyendo velocidad excepcional, uso de herramientas nativas, generación multimodal y una ventana de contexto de 1M tokens."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Variante del modelo Gemini 2.0 Flash, optimizada para objetivos como la rentabilidad y la baja latencia."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Variante del modelo Gemini 2.0 Flash, optimizada para objetivos como la rentabilidad y la baja latencia."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Un modelo Gemini 2.0 Flash optimizado para objetivos de costo-efectividad y baja latencia."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp es el último modelo experimental de IA multimodal de Google, con características de próxima generación, velocidad excepcional, llamadas nativas a herramientas y generación multimodal."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp es el último modelo experimental de IA multimodal de Google, con características de próxima generación, velocidad excepcional, llamadas nativas a herramientas y generación multimodal."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "El último modelo GPT-4 Turbo cuenta con funciones visuales. Ahora, las solicitudes visuales pueden utilizar el modo JSON y llamadas a funciones. GPT-4 Turbo es una versión mejorada que ofrece soporte rentable para tareas multimodales. Encuentra un equilibrio entre precisión y eficiencia, adecuado para aplicaciones que requieren interacción en tiempo real."
  },
+  "gpt-4.5-preview": {
+    "description": "Versión de investigación de GPT-4.5, que es nuestro modelo GPT más grande y potente hasta la fecha. Posee un amplio conocimiento del mundo y puede comprender mejor la intención del usuario, lo que lo hace destacar en tareas creativas y planificación autónoma. GPT-4.5 acepta entradas de texto e imagen y genera salidas de texto (incluidas salidas estructuradas). Soporta funciones clave para desarrolladores, como llamadas a funciones, API por lotes y salida en streaming. En tareas que requieren pensamiento creativo, abierto y diálogo (como escritura, aprendizaje o exploración de nuevas ideas), GPT-4.5 brilla especialmente. La fecha límite de conocimiento es octubre de 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o es un modelo dinámico que se actualiza en tiempo real para mantener la versión más actual. Combina una poderosa comprensión y generación de lenguaje, adecuado para aplicaciones a gran escala, incluyendo servicio al cliente, educación y soporte técnico."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B es un modelo de alto rendimiento que ofrece una rápida capacidad de generación de texto, ideal para aplicaciones que requieren eficiencia a gran escala y rentabilidad."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "El modelo Llama 3.1 Sonar Huge Online, con 405B de parámetros, soporta una longitud de contexto de aproximadamente 127,000 tokens, diseñado para aplicaciones de chat en línea complejas."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "El modelo Llama 3.1 Sonar Large Online, con 70B de parámetros, soporta una longitud de contexto de aproximadamente 127,000 tokens, adecuado para tareas de chat de alta capacidad y diversidad."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "El modelo Llama 3.1 Sonar Small Online, con 8B de parámetros, soporta una longitud de contexto de aproximadamente 127,000 tokens, diseñado para chat en línea, capaz de manejar eficientemente diversas interacciones textuales."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Capacidad excepcional de razonamiento visual en imágenes de alta resolución, adecuada para aplicaciones de comprensión visual."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 está diseñado para manejar tareas que combinan datos visuales y textuales. Destaca en tareas como la descripción de imágenes y preguntas visuales, superando la brecha entre la generación de lenguaje y el razonamiento visual."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 está diseñado para manejar tareas que combinan datos visuales y textuales. Destaca en tareas como la descripción de imágenes y preguntas visuales, superando la brecha entre la generación de lenguaje y el razonamiento visual."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "El modelo de lenguaje a gran escala Tongyi Qwen de nivel de cientos de miles de millones, que admite entradas en diferentes idiomas como chino e inglés, es el modelo API detrás de la versión del producto Tongyi Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "La serie de modelos Qwen-Omni admite la entrada de datos en múltiples modalidades, incluyendo video, audio, imágenes y texto, y produce audio y texto como salida."
+  },
  "qwen-plus": {
    "description": "La versión mejorada del modelo de lenguaje a gran escala Qwen admite entradas en diferentes idiomas como chino e inglés."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Iniciado con el modelo de lenguaje Qwen-7B, se añade un modelo de imagen, un modelo preentrenado con una resolución de entrada de imagen de 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 es una nueva serie de modelos de lenguaje grande Qwen. Qwen2 7B es un modelo basado en transformador que destaca en comprensión del lenguaje, capacidades multilingües, programación, matemáticas y razonamiento."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 es una nueva serie de modelos de lenguaje de gran tamaño, con una mayor capacidad de comprensión y generación."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL es la última iteración del modelo Qwen-VL, alcanzando un rendimiento de vanguardia en pruebas de comprensión visual, incluyendo MathVista, DocVQA, RealWorldQA y MTVQA. Qwen2-VL puede entender videos de más de 20 minutos, permitiendo preguntas y respuestas, diálogos y creación de contenido de alta calidad basados en video. También posee capacidades complejas de razonamiento y toma de decisiones, pudiendo integrarse con dispositivos móviles, robots, etc., para realizar operaciones automáticas basadas en el entorno visual y las instrucciones de texto. Además del inglés y el chino, Qwen2-VL ahora también admite la comprensión de texto en diferentes idiomas dentro de imágenes, incluyendo la mayoría de los idiomas europeos, japonés, coreano, árabe y vietnamita."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct es una de las últimas series de modelos de lenguaje grande lanzadas por Alibaba Cloud. Este modelo de 72B presenta capacidades significativamente mejoradas en áreas como codificación y matemáticas. También ofrece soporte multilingüe, abarcando más de 29 idiomas, incluidos chino e inglés. El modelo ha mejorado notablemente en el seguimiento de instrucciones, la comprensión de datos estructurados y la generación de salidas estructuradas (especialmente JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct es una de las últimas series de modelos de lenguaje grande lanzadas por Alibaba Cloud. Este modelo de 32B presenta capacidades significativamente mejoradas en áreas como codificación y matemáticas. También ofrece soporte multilingüe, abarcando más de 29 idiomas, incluidos chino e inglés. El modelo ha mejorado notablemente en el seguimiento de instrucciones, la comprensión de datos estructurados y la generación de salidas estructuradas (especialmente JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM orientado a chino e inglés, enfocado en áreas como lenguaje, programación, matemáticas y razonamiento."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ es un modelo de investigación experimental que se centra en mejorar la capacidad de razonamiento de la IA."
  },
+  "qwq-32b": {
+    "description": "El modelo de inferencia QwQ, entrenado con el modelo Qwen2.5-32B, ha mejorado significativamente su capacidad de inferencia a través del aprendizaje por refuerzo. Los indicadores clave del modelo, como el código matemático y otros indicadores centrales (AIME 24/25, LiveCodeBench), así como algunos indicadores generales (IFEval, LiveBench, etc.), han alcanzado el nivel del modelo DeepSeek-R1 en su versión completa, superando notablemente a DeepSeek-R1-Distill-Qwen-32B, que también se basa en Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "El modelo QwQ es un modelo de investigación experimental desarrollado por el equipo de Qwen, enfocado en mejorar la capacidad de razonamiento de la IA."
  },
+  "qwq-plus-latest": {
+    "description": "El modelo de inferencia QwQ, entrenado con el modelo Qwen2.5, ha mejorado significativamente su capacidad de inferencia a través del aprendizaje por refuerzo. Los indicadores clave del modelo, como el código matemático y otros indicadores centrales (AIME 24/25, LiveCodeBench), así como algunos indicadores generales (IFEval, LiveBench, etc.), han alcanzado el nivel del modelo DeepSeek-R1 en su versión completa."
+  },
+  "r1-1776": {
+    "description": "R1-1776 es una versión del modelo DeepSeek R1, que ha sido entrenada posteriormente para proporcionar información factual sin censura y sin sesgos."
+  },
  "solar-mini": {
    "description": "Solar Mini es un LLM compacto que supera a GPT-3.5, con potentes capacidades multilingües, soportando inglés y coreano, ofreciendo soluciones eficientes y compactas."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Producto de búsqueda ligero basado en contexto de búsqueda, más rápido y económico que Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research realiza una investigación exhaustiva a nivel de expertos y la compila en informes accesibles y prácticos."
+  },
  "sonar-pro": {
    "description": "Producto de búsqueda avanzada que soporta contexto de búsqueda, consultas avanzadas y seguimiento."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Un modelo de Embedding de nueva generación, eficiente y económico, adecuado para la recuperación de conocimiento, aplicaciones RAG y más."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "Versión de código abierto de la última generación del modelo preentrenado GLM-4 lanzado por Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) proporciona una capacidad de cálculo mejorada a través de estrategias y arquitecturas de modelos eficientes."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet eleva el estándar de la industria, superando a modelos competidores y a Claude 3 Opus, destacándose en evaluaciones amplias, mientras mantiene la velocidad y costo de nuestros modelos de nivel medio."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonnet es el modelo de próxima generación más rápido de Anthropic. En comparación con Claude 3 Haiku, Claude 3.7 Sonnet ha mejorado en todas las habilidades y ha superado al modelo más grande de la generación anterior, Claude 3 Opus, en muchas pruebas de referencia de inteligencia."
+  },
  "whisper-1": {
    "description": "Modelo de reconocimiento de voz general, que admite reconocimiento de voz multilingüe, traducción de voz y reconocimiento de idiomas."
  },
@@ -140,6 +140,18 @@
      "close": "Eliminar",
      "confirm": "Configuración completada, intente de nuevo"
    },
+    "crawPages": {
+      "crawling": "Reconocimiento de enlaces",
+      "detail": {
+        "preview": "Vista previa",
+        "raw": "Texto original",
+        "tooLong": "El contenido del texto es demasiado largo, el contexto de la conversación solo retiene los primeros {{characters}} caracteres, el resto no se incluye en el contexto de la conversación"
+      },
+      "meta": {
+        "crawler": "Modo de rastreo",
+        "words": "Número de caracteres"
+      }
+    },
    "searchxng": {
      "baseURL": "Introduzca",
      "description": "Introduzca la URL de SearchXNG para comenzar la búsqueda en línea",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity es un proveedor líder de modelos de generación de diálogos, ofreciendo varios modelos avanzados de Llama 3.1, que son adecuados para aplicaciones en línea y fuera de línea, especialmente para tareas complejas de procesamiento del lenguaje natural."
  },
+  "ppio": {
+    "description": "PPIO Paiouyun ofrece servicios de API de modelos de código abierto estables y de alto rendimiento, que admiten toda la serie DeepSeek, Llama, Qwen y otros modelos grandes líderes en la industria."
+  },
  "qwen": {
    "description": "Tongyi Qianwen es un modelo de lenguaje de gran escala desarrollado de forma independiente por Alibaba Cloud, con potentes capacidades de comprensión y generación de lenguaje natural. Puede responder a diversas preguntas, crear contenido escrito, expresar opiniones y redactar código, desempeñando un papel en múltiples campos."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "نسخه‌ای از {{title}}",
  "emptyAgent": "دستیار موجود نیست",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "هزینه تولید یک گفت‌وگو می‌تواند تا 90% کاهش یابد و سرعت پاسخ‌دهی 4 برابر افزایش یابد (<1>بیشتر بدانید</1>) . با فعال‌سازی این گزینه، محدودیت تعداد پیام‌های تاریخی به‌طور خودکار غیرفعال خواهد شد",
+      "title": "فعال‌سازی کش زمینه"
+    },
    "enableReasoning": {
+      "desc": "محدودیت‌های مبتنی بر مکانیزم تفکر کلاود (<1>بیشتر بدانید</1>) . با فعال‌سازی این گزینه، محدودیت تعداد پیام‌های تاریخی به‌طور خودکار غیرفعال خواهد شد",
      "title": "فعال‌سازی تفکر عمیق"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "ویژگی‌های گسترش مدل"
  },
+  "history": {
+    "title": "دستیار فقط آخرین {{count}} پیام را به خاطر خواهد سپرد"
+  },
  "historyRange": "محدوده تاریخی",
  "historySummary": "خلاصه پیام‌های تاریخی",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "زیرموضوع وجود دارد، نمی‌توان حذف کرد",
    "regenerate": "بازتولید"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "اعتبار",
+      "creditPricing": "قیمت گذاری",
+      "creditTooltip": "برای سهولت در شمارش، ما 1$ را به 1M اعتبار تبدیل می‌کنیم، به عنوان مثال $3/M توکن‌ها معادل 3 اعتبار/token است",
+      "pricing": {
+        "inputCachedTokens": "ورودی کش شده {{amount}}/اعتبار · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M کاراکتر",
+        "inputMinutes": "${{amount}}/دقیقه",
+        "inputTokens": "ورودی {{amount}}/اعتبار · ${{amount}}/M",
+        "outputTokens": "خروجی {{amount}}/اعتبار · ${{amount}}/M",
+        "writeCacheInputTokens": "ذخیره ورودی نوشتن {{amount}}/امتیاز · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "میانگین قیمت",
+      "input": "ورودی",
+      "inputAudio": "ورودی صوتی",
+      "inputCached": "ورودی کش شده",
+      "inputCitation": "ارجاع ورودی",
+      "inputText": "ورودی متنی",
+      "inputTitle": "جزئیات ورودی",
+      "inputUncached": "ورودی غیر کش شده",
+      "inputWriteCached": "ذخیره ورودی نوشتن",
+      "output": "خروجی",
+      "outputAudio": "خروجی صوتی",
+      "outputText": "خروجی متنی",
+      "outputTitle": "جزئیات خروجی",
+      "reasoning": "تفکر عمیق",
+      "title": "جزئیات تولید",
+      "total": "مجموع مصرف"
+    }
+  },
  "newAgent": "دستیار جدید",
  "pin": "سنجاق کردن",
  "pinOff": "لغو سنجاق",
@@ -322,6 +322,9 @@
    "tooltip": "به‌روزرسانی پیکربندی پایه ارائه‌دهنده",
    "updateSuccess": "به‌روزرسانی با موفقیت انجام شد"
  },
+  "updateCustomAiProvider": {
+    "title": "به‌روزرسانی تنظیمات ارائه‌دهنده AI سفارشی"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "کلیدهای Vertex AI خود را وارد کنید",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B از 16K توکن پشتیبانی می‌کند و توانایی تولید زبان به‌صورت کارآمد و روان را ارائه می‌دهد."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything، جدیدترین مدل متن باز تنظیم شده با 34 میلیارد پارامتر، که تنظیمات آن از چندین سناریوی گفتگویی پشتیبانی می‌کند و داده‌های آموزشی با کیفیت بالا را برای هم‌راستایی با ترجیحات انسانی فراهم می‌کند."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything، جدیدترین مدل متن باز تنظیم شده با 9 میلیارد پارامتر، که تنظیمات آن از چندین سناریوی گفتگویی پشتیبانی می‌کند و داده‌های آموزشی با کیفیت بالا را برای هم‌راستایی با ترجیحات انسانی فراهم می‌کند."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro به عنوان یکی از اعضای مهم سری مدل‌های 360 AI، با توانایی پردازش متون به‌صورت کارآمد، نیازهای متنوع در زمینه‌های مختلف کاربردهای زبان طبیعی را برآورده می‌کند و از قابلیت‌هایی مانند درک متون طولانی و مکالمات چندمرحله‌ای پشتیبانی می‌کند."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview یک مدل تحقیقاتی است که توسط تیم Qwen توسعه یافته و بر روی توانایی‌های استنتاج بصری تمرکز دارد و در درک صحنه‌های پیچیده و حل مسائل ریاضی مرتبط با بصری دارای مزیت‌های منحصر به فردی است."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ مدل استنتاجی از سری Qwen است. در مقایسه با مدل‌های سنتی بهینه‌سازی دستورالعمل، QwQ دارای توانایی تفکر و استنتاج است و می‌تواند در وظایف پایین‌دستی عملکرد قابل توجهی را به ویژه در حل مسائل دشوار ارائه دهد. QwQ-32B یک مدل استنتاجی متوسط است که می‌تواند در مقایسه با مدل‌های استنتاجی پیشرفته (مانند DeepSeek-R1، o1-mini) عملکرد رقابتی را به دست آورد. این مدل از تکنیک‌هایی مانند RoPE، SwiGLU، RMSNorm و Attention QKV bias استفاده می‌کند و دارای ساختار شبکه 64 لایه و 40 سر توجه Q (در معماری GQA، KV برابر با 8 است) می‌باشد."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview جدیدترین مدل تحقیقاتی تجربی Qwen است که بر بهبود توانایی استدلال AI تمرکز دارد. با کاوش در مکانیزم‌های پیچیده‌ای مانند ترکیب زبان و استدلال بازگشتی، مزایای اصلی شامل توانایی تحلیل استدلال قوی، توانایی ریاضی و برنامه‌نویسی است. در عین حال، مشکلاتی مانند تغییر زبان، حلقه‌های استدلال، ملاحظات ایمنی و تفاوت‌های دیگر در توانایی‌ها وجود دارد."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet استانداردهای صنعت را ارتقا داده است، عملکردی بهتر از مدل‌های رقیب و Claude 3 Opus دارد، در ارزیابی‌های گسترده به خوبی عمل کرده و در عین حال سرعت و هزینه مدل‌های سطح متوسط ما را حفظ می‌کند."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "سونت کلود 3.7 سریع‌ترین مدل نسل بعدی آنتروپیک است. در مقایسه با کلود 3 هایکو، سونت کلود 3.7 در تمام مهارت‌ها بهبود یافته و در بسیاری از آزمون‌های استاندارد هوش از بزرگ‌ترین مدل نسل قبلی، کلود 3 اوپوس، پیشی گرفته است."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku سریع‌ترین و فشرده‌ترین مدل Anthropic است که پاسخ‌های تقریباً فوری ارائه می‌دهد. این مدل می‌تواند به سرعت به پرسش‌ها و درخواست‌های ساده پاسخ دهد. مشتریان قادر خواهند بود تجربه‌های هوش مصنوعی یکپارچه‌ای را که تعاملات انسانی را تقلید می‌کند، ایجاد کنند. Claude 3 Haiku می‌تواند تصاویر را پردازش کرده و خروجی متنی ارائه دهد و دارای پنجره متنی 200K است."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 یک مدل چندزبانه است که توسط Cohere ارائه شده و از 23 زبان پشتیبانی می‌کند و استفاده از برنامه‌های چندزبانه را تسهیل می‌نماید."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B یک مدل زبان بزرگ متن باز و قابل تجاری با 130 میلیارد پارامتر است که در آزمون‌های معتبر چینی و انگلیسی بهترین عملکرد را در اندازه مشابه به دست آورده است."
+  },
  "charglm-3": {
    "description": "CharGLM-3 به‌طور ویژه برای نقش‌آفرینی و همراهی عاطفی طراحی شده است، از حافظه طولانی‌مدت و مکالمات شخصی‌سازی‌شده پشتیبانی می‌کند و کاربردهای گسترده‌ای دارد."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 با وجود داده‌های برچسب‌گذاری شده بسیار کم، توانایی استدلال مدل را به طرز چشمگیری افزایش می‌دهد. قبل از ارائه پاسخ نهایی، مدل ابتدا یک زنجیره تفکر را تولید می‌کند تا دقت پاسخ نهایی را افزایش دهد."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B یک مدل زبان بزرگ مبتنی بر Llama3.3 70B است که با استفاده از تنظیمات DeepSeek R1 به عملکرد رقابتی معادل مدل‌های پیشرفته بزرگ دست یافته است."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B یک مدل زبان بزرگ تقطیر شده مبتنی بر Llama-3.1-8B-Instruct است که با استفاده از خروجی DeepSeek R1 آموزش دیده است."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B یک مدل زبان بزرگ تقطیر شده مبتنی بر Qwen 2.5 14B است که با استفاده از خروجی DeepSeek R1 آموزش دیده است. این مدل در چندین آزمون معیار از o1-mini OpenAI پیشی گرفته و به آخرین دستاوردهای فناوری مدل‌های متراکم (dense models) دست یافته است. نتایج برخی از آزمون‌های معیار به شرح زیر است:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nاین مدل با تنظیمات خروجی DeepSeek R1، عملکرد رقابتی معادل مدل‌های پیشرفته بزرگتر را نشان می‌دهد."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B یک مدل زبان بزرگ تقطیر شده مبتنی بر Qwen 2.5 32B است که با استفاده از خروجی DeepSeek R1 آموزش دیده است. این مدل در چندین آزمون معیار از o1-mini OpenAI پیشی گرفته و به آخرین دستاوردهای فناوری مدل‌های متراکم (dense models) دست یافته است. نتایج برخی از آزمون‌های معیار به شرح زیر است:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nاین مدل با تنظیمات خروجی DeepSeek R1، عملکرد رقابتی معادل مدل‌های پیشرفته بزرگتر را نشان می‌دهد."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 جدیدترین مدل متن باز منتشر شده توسط تیم DeepSeek است که دارای عملکرد استدلال بسیار قوی است و به ویژه در وظایف ریاضی، برنامه‌نویسی و استدلال به سطحی معادل مدل o1 OpenAI رسیده است."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 با وجود داده‌های برچسب‌گذاری شده بسیار کم، توانایی استدلال مدل را به طرز چشمگیری افزایش می‌دهد. قبل از ارائه پاسخ نهایی، مدل ابتدا یک زنجیره تفکر را تولید می‌کند تا دقت پاسخ نهایی را افزایش دهد."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 در سرعت استدلال به یک پیشرفت عمده نسبت به مدل‌های قبلی دست یافته است. این مدل در بین مدل‌های متن باز رتبه اول را دارد و می‌تواند با پیشرفته‌ترین مدل‌های بسته جهانی رقابت کند. DeepSeek-V3 از معماری توجه چندسر (MLA) و DeepSeekMoE استفاده می‌کند که این معماری‌ها در DeepSeek-V2 به طور کامل تأیید شده‌اند. علاوه بر این، DeepSeek-V3 یک استراتژی کمکی بدون ضرر برای تعادل بار معرفی کرده و اهداف آموزشی پیش‌بینی چند برچسبی را برای بهبود عملکرد تعیین کرده است."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 در سرعت استدلال به یک پیشرفت عمده نسبت به مدل‌های قبلی دست یافته است. این مدل در بین مدل‌های متن باز رتبه اول را دارد و می‌تواند با پیشرفته‌ترین مدل‌های بسته جهانی رقابت کند. DeepSeek-V3 از معماری توجه چندسر (MLA) و DeepSeekMoE استفاده می‌کند که این معماری‌ها در DeepSeek-V2 به طور کامل تأیید شده‌اند. علاوه بر این، DeepSeek-V3 یک استراتژی کمکی بدون ضرر برای تعادل بار معرفی کرده و اهداف آموزشی پیش‌بینی چند برچسبی را برای بهبود عملکرد تعیین کرده است."
+  },
  "doubao-1.5-lite-32k": {
    "description": "مدل سبک نسل جدید Doubao-1.5-lite، با سرعت پاسخ‌دهی فوق‌العاده، عملکرد و تأخیر در سطح جهانی را ارائه می‌دهد."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash ویژگی‌ها و بهبودهای نسل بعدی را ارائه می‌دهد، از جمله سرعت عالی، استفاده از ابزارهای بومی، تولید چندرسانه‌ای و پنجره متن 1M توکن."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "مدل متغیر Gemini 2.0 Flash برای بهینه‌سازی هزینه و تأخیر کم طراحی شده است."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "مدل متغیر Gemini 2.0 Flash برای بهینه‌سازی هزینه و تأخیر کم طراحی شده است."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "مدل Gemini 2.0 Flash که برای بهینه‌سازی هزینه و تأخیر کم طراحی شده است."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp جدیدترین مدل AI چندرسانه‌ای آزمایشی گوگل است که دارای ویژگی‌های نسل بعدی، سرعت فوق‌العاده، فراخوانی ابزار بومی و تولید چندرسانه‌ای است."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp جدیدترین مدل AI چندرسانه‌ای آزمایشی گوگل است که دارای ویژگی‌های نسل بعدی، سرعت فوق‌العاده، فراخوانی ابزار بومی و تولید چندرسانه‌ای است."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "جدیدترین مدل GPT-4 Turbo دارای قابلیت‌های بصری است. اکنون درخواست‌های بصری می‌توانند از حالت JSON و فراخوانی توابع استفاده کنند. GPT-4 Turbo نسخه‌ای پیشرفته است که پشتیبانی مقرون‌به‌صرفه‌ای برای وظایف چندوجهی ارائه می‌دهد. این مدل بین دقت و کارایی تعادل برقرار می‌کند و برای سناریوهای کاربردی که نیاز به تعاملات بلادرنگ دارند، مناسب است."
  },
+  "gpt-4.5-preview": {
+    "description": "نسخه پیش‌نمایش تحقیقاتی GPT-4.5، بزرگ‌ترین و قدرتمندترین مدل GPT ما تا به امروز است. این مدل دارای دانش وسیع جهانی است و می‌تواند بهتر از قبل نیت‌های کاربران را درک کند، که باعث می‌شود در وظایف خلاقانه و برنامه‌ریزی مستقل عملکرد فوق‌العاده‌ای داشته باشد. GPT-4.5 قادر به پذیرش ورودی‌های متنی و تصویری است و خروجی‌های متنی (شامل خروجی‌های ساختاریافته) تولید می‌کند. از ویژگی‌های کلیدی توسعه‌دهندگان مانند فراخوانی توابع، API دسته‌ای و خروجی جریانی پشتیبانی می‌کند. در وظایفی که نیاز به تفکر خلاق، تفکر باز و گفتگو دارند (مانند نوشتن، یادگیری یا کاوش ایده‌های جدید)، GPT-4.5 به‌ویژه عملکرد خوبی دارد. تاریخ قطع دانش در اکتبر 2023 است."
+  },
  "gpt-4o": {
    "description": "پیشرفته‌ترین مدل چندوجهی در سری GPT-4 OpenAI که می‌تواند ورودی‌های متنی و تصویری را پردازش کند."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B یک مدل با کارایی بالا است که توانایی تولید سریع متن را فراهم می‌کند و برای کاربردهایی که به بهره‌وری و صرفه‌جویی در هزینه در مقیاس بزرگ نیاز دارند، بسیار مناسب است."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "مدل Llama 3.1 Sonar Huge Online با 405 میلیارد پارامتر، پشتیبانی از طول زمینه حدود 127,000 نشانه، طراحی شده برای برنامه‌های چت آنلاین پیچیده."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "مدل Llama 3.1 Sonar Large Online با 70 میلیارد پارامتر، پشتیبانی از طول زمینه حدود 127,000 نشانه، مناسب برای وظایف چت با حجم بالا و متنوع."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "مدل Llama 3.1 Sonar Small Online با 8 میلیارد پارامتر، پشتیبانی از طول زمینه‌ای حدود 127,000 نشانه، به‌طور ویژه برای چت آنلاین طراحی شده و می‌تواند به‌طور کارآمد انواع تعاملات متنی را پردازش کند."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "توانایی استدلال تصویری عالی در تصاویر با وضوح بالا، مناسب برای برنامه‌های درک بصری."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 برای انجام وظایفی که ترکیبی از داده‌های بصری و متنی هستند طراحی شده است. این مدل در وظایفی مانند توصیف تصویر و پرسش و پاسخ بصری عملکرد بسیار خوبی دارد و فاصله بین تولید زبان و استدلال بصری را پر می‌کند."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 برای انجام وظایفی طراحی شده است که داده‌های بصری و متنی را با هم ترکیب می‌کند. این مدل در وظایفی مانند توصیف تصویر و پرسش و پاسخ بصری عملکرد بسیار خوبی دارد و فاصله بین تولید زبان و استدلال بصری را پر می‌کند."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "مدل زبانی بسیار بزرگ با مقیاس میلیاردی تونگی چیان‌ون، که از ورودی‌های زبان‌های مختلف مانند چینی، انگلیسی و غیره پشتیبانی می‌کند. مدل API پشت نسخه محصول تونگی چیان‌ون 2.5 فعلی."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "مدل‌های سری Qwen-Omni از ورودی داده‌های چندگانه شامل ویدیو، صدا، تصویر و متن پشتیبانی می‌کنند و خروجی‌های صوتی و متنی تولید می‌کنند."
+  },
  "qwen-plus": {
    "description": "مدل زبان بسیار بزرگ Qwen در نسخه تقویت شده، از ورودی زبان‌های مختلف مانند چینی و انگلیسی پشتیبانی می‌کند."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "مدل زبان Qwen-7B با اضافه کردن مدل تصویر و وضوح ورودی تصویر 448، به عنوان یک مدل پیش‌آموزش‌شده، اولیه‌سازی شده است."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 یک سری جدید از مدل‌های زبان بزرگ Qwen است. Qwen2 7B یک مدل مبتنی بر ترنسفورمر است که در درک زبان، قابلیت‌های چند زبانه، برنامه‌نویسی، ریاضی و استدلال عملکرد عالی دارد."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 یک سری جدید از مدل‌های زبان بزرگ است که دارای توانایی‌های درک و تولید قوی‌تری می‌باشد."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL جدیدترین نسخه از مدل Qwen-VL است که در آزمون‌های معیار درک بصری به عملکرد پیشرفته‌ای دست یافته است، از جمله MathVista، DocVQA، RealWorldQA و MTVQA. Qwen2-VL قادر به درک ویدیوهای بیش از 20 دقیقه است و برای پرسش و پاسخ، گفتگو و تولید محتوا مبتنی بر ویدیو با کیفیت بالا استفاده می‌شود. این مدل همچنین دارای قابلیت‌های پیچیده استدلال و تصمیم‌گیری است و می‌تواند با دستگاه‌های موبایل، ربات‌ها و غیره ادغام شود و بر اساس محیط بصری و دستورات متنی به طور خودکار عمل کند. علاوه بر انگلیسی و چینی، Qwen2-VL اکنون از درک متن‌های مختلف زبان در تصاویر نیز پشتیبانی می‌کند، از جمله بیشتر زبان‌های اروپایی، ژاپنی، کره‌ای، عربی و ویتنامی."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct یکی از جدیدترین سری مدل‌های زبان بزرگ منتشر شده توسط Alibaba Cloud است. این مدل 72B در زمینه‌های کدنویسی و ریاضی دارای قابلیت‌های بهبود یافته قابل توجهی است. این مدل همچنین از چندین زبان پشتیبانی می‌کند و بیش از 29 زبان از جمله چینی و انگلیسی را پوشش می‌دهد. این مدل در پیروی از دستورات، درک داده‌های ساختاری و تولید خروجی‌های ساختاری (به ویژه JSON) بهبودهای قابل توجهی داشته است."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct یکی از جدیدترین سری مدل‌های زبان بزرگ منتشر شده توسط Alibaba Cloud است. این مدل 32B در زمینه‌های کدنویسی و ریاضی دارای قابلیت‌های بهبود یافته قابل توجهی است. این مدل از چندین زبان پشتیبانی می‌کند و بیش از 29 زبان از جمله چینی و انگلیسی را پوشش می‌دهد. این مدل در پیروی از دستورات، درک داده‌های ساختاری و تولید خروجی‌های ساختاری (به ویژه JSON) بهبودهای قابل توجهی داشته است."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "مدل LLM برای زبان‌های چینی و انگلیسی که در زمینه‌های زبان، برنامه‌نویسی، ریاضیات و استدلال تخصص دارد."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ یک مدل تحقیقاتی تجربی است که بر بهبود توانایی استدلال AI تمرکز دارد."
  },
+  "qwq-32b": {
+    "description": "مدل استنتاج QwQ مبتنی بر مدل Qwen2.5-32B است که از طریق یادگیری تقویتی به طور قابل توجهی توانایی استنتاج مدل را افزایش داده است. شاخص‌های اصلی مدل مانند کد ریاضی (AIME 24/25، LiveCodeBench) و برخی از شاخص‌های عمومی (IFEval، LiveBench و غیره) به سطح DeepSeek-R1 نسخه کامل رسیده‌اند و تمامی شاخص‌ها به طور قابل توجهی از DeepSeek-R1-Distill-Qwen-32B که نیز مبتنی بر Qwen2.5-32B است، پیشی گرفته‌اند."
+  },
  "qwq-32b-preview": {
    "description": "مدل QwQ یک مدل تحقیقاتی تجربی است که توسط تیم Qwen توسعه یافته و بر تقویت توانایی استدلال AI تمرکز دارد."
  },
+  "qwq-plus-latest": {
+    "description": "مدل استنتاج QwQ مبتنی بر مدل Qwen2.5 است که از طریق یادگیری تقویتی به طور قابل توجهی توانایی استنتاج مدل را افزایش داده است. شاخص‌های اصلی مدل مانند کد ریاضی (AIME 24/25، LiveCodeBench) و برخی از شاخص‌های عمومی (IFEval، LiveBench و غیره) به سطح DeepSeek-R1 نسخه کامل رسیده‌اند."
+  },
+  "r1-1776": {
+    "description": "R1-1776 نسخه‌ای از مدل DeepSeek R1 است که پس از آموزش مجدد، اطلاعات واقعی بدون سانسور و بدون تعصب را ارائه می‌دهد."
+  },
  "solar-mini": {
    "description": "Solar Mini یک LLM فشرده است که عملکردی بهتر از GPT-3.5 دارد و دارای توانایی‌های چند زبانه قوی است و از انگلیسی و کره‌ای پشتیبانی می‌کند و راه‌حل‌های کارآمد و کوچکی را ارائه می‌دهد."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "محصول جستجوی سبک بر اساس زمینه جستجو که سریع‌تر و ارزان‌تر از Sonar Pro است."
  },
+  "sonar-deep-research": {
+    "description": "تحقیق عمیق، تحقیقاتی جامع و تخصصی را انجام می‌دهد و آن را به گزارش‌های قابل دسترسی و قابل استفاده تبدیل می‌کند."
+  },
  "sonar-pro": {
    "description": "محصول جستجوی پیشرفته که از جستجوی زمینه پشتیبانی می‌کند و قابلیت‌های پیشرفته‌ای برای پرسش و پیگیری دارد."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "مدل جدید و کارآمد Embedding، مناسب برای جستجوی دانش، کاربردهای RAG و سایر سناریوها."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "نسخه متن باز جدیدترین نسل مدل‌های پیش‌آموزش GLM-4 منتشر شده توسط Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) با استفاده از استراتژی‌ها و معماری مدل کارآمد، توان محاسباتی بهبودیافته‌ای را ارائه می‌دهد."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet استانداردهای صنعتی را ارتقا داده و عملکردی فراتر از مدل‌های رقیب و Claude 3 Opus دارد و در ارزیابی‌های گسترده‌ای عملکرد عالی از خود نشان می‌دهد، در حالی که سرعت و هزینه مدل‌های سطح متوسط ما را نیز داراست."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonnet سریع‌ترین مدل نسل بعدی Anthropic است. در مقایسه با Claude 3 Haiku، Claude 3.7 Sonnet در تمام مهارت‌ها بهبود یافته و در بسیاری از آزمون‌های استاندارد هوش از بزرگ‌ترین مدل نسل قبلی، Claude 3 Opus، پیشی گرفته است."
+  },
  "whisper-1": {
    "description": "مدل شناسایی گفتار عمومی، پشتیبانی از شناسایی گفتار چند زبانه، ترجمه گفتار و شناسایی زبان."
  },
@@ -140,6 +140,18 @@
      "close": "حذف",
      "confirm": "پیکربندی کامل و دوباره تلاش کنید"
    },
+    "crawPages": {
+      "crawling": "در حال شناسایی لینک",
+      "detail": {
+        "preview": "پیش‌نمایش",
+        "raw": "متن اصلی",
+        "tooLong": "متن بسیار طولانی است، فقط {{characters}} کاراکتر اول در زمینه گفتگو حفظ می‌شود و بخش‌های اضافی در زمینه گفتگو محاسبه نمی‌شوند"
+      },
+      "meta": {
+        "crawler": "مدل خزنده",
+        "words": "تعداد کاراکتر"
+      }
+    },
    "searchxng": {
      "baseURL": "لطفاً وارد کنید",
      "description": "لطفاً آدرس وب SearchXNG را وارد کنید تا جستجوی آنلاین را شروع کنید",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity یک ارائه‌دهنده پیشرو در مدل‌های تولید مکالمه است که انواع مدل‌های پیشرفته Llama 3.1 را ارائه می‌دهد و از برنامه‌های آنلاین و آفلاین پشتیبانی می‌کند. این مدل‌ها به‌ویژه برای وظایف پیچیده پردازش زبان طبیعی مناسب هستند."
  },
+  "ppio": {
+    "description": "PPIO پایو کلود خدمات API مدل‌های متن باز با ثبات و با قیمت مناسب را ارائه می‌دهد و از تمام سری‌های DeepSeek، Llama، Qwen و سایر مدل‌های بزرگ پیشرو در صنعت پشتیبانی می‌کند."
+  },
  "qwen": {
    "description": "چوان یی چیان ون یک مدل زبان بسیار بزرگ است که توسط علی‌کلود به‌طور مستقل توسعه یافته و دارای توانایی‌های قدرتمند درک و تولید زبان طبیعی است. این مدل می‌تواند به انواع سوالات پاسخ دهد، محتوای متنی خلق کند، نظرات و دیدگاه‌ها را بیان کند، کد بنویسد و در حوزه‌های مختلف نقش ایفا کند."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Copie",
  "emptyAgent": "Aucun assistant disponible",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "Le coût de génération d'une seule conversation peut être réduit de 90 % au maximum, avec une vitesse de réponse augmentée de 4 fois (<1>En savoir plus</1>). Une fois activé, la limite du nombre de messages historiques sera automatiquement désactivée.",
+      "title": "Activer le cache de contexte"
+    },
    "enableReasoning": {
+      "desc": "Basé sur les restrictions du mécanisme Claude Thinking (<1>En savoir plus</1>), une fois activé, la limite du nombre de messages historiques sera automatiquement désactivée.",
      "title": "Activer la réflexion approfondie"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Fonctionnalités d'extension du modèle"
  },
+  "history": {
+    "title": "L'assistant ne se souviendra que des {{count}} derniers messages"
+  },
  "historyRange": "Plage d'historique",
  "historySummary": "Résumé des messages historiques",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Il existe des sous-sujets, la suppression n'est pas possible.",
    "regenerate": "Régénérer"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Crédit",
+      "creditPricing": "Tarification",
+      "creditTooltip": "Pour faciliter le comptage, nous convertissons 1 $ en 1M de crédits, par exemple, 3 $/M tokens équivaut à 3 crédits/token",
+      "pricing": {
+        "inputCachedTokens": "Entrée mise en cache {{amount}}/crédit · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M caractères",
+        "inputMinutes": "${{amount}}/minute",
+        "inputTokens": "Entrée {{amount}}/crédit · ${{amount}}/M",
+        "outputTokens": "Sortie {{amount}}/crédit · ${{amount}}/M",
+        "writeCacheInputTokens": "Écriture de cache d'entrée {{amount}}/points · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Prix moyen",
+      "input": "Entrée",
+      "inputAudio": "Entrée audio",
+      "inputCached": "Entrée mise en cache",
+      "inputCitation": "Citation d'entrée",
+      "inputText": "Entrée texte",
+      "inputTitle": "Détails de l'entrée",
+      "inputUncached": "Entrée non mise en cache",
+      "inputWriteCached": "Écriture de cache d'entrée",
+      "output": "Sortie",
+      "outputAudio": "Sortie audio",
+      "outputText": "Sortie texte",
+      "outputTitle": "Détails de la sortie",
+      "reasoning": "Raisonnement approfondi",
+      "title": "Détails de génération",
+      "total": "Total consommé"
+    }
+  },
  "newAgent": "Nouvel agent",
  "pin": "Épingler",
  "pinOff": "Désépingler",
@@ -322,6 +322,9 @@
    "tooltip": "Mettre à jour la configuration de base du fournisseur",
    "updateSuccess": "Mise à jour réussie"
  },
+  "updateCustomAiProvider": {
+    "title": "Mettre à jour la configuration du fournisseur de services AI personnalisé"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Entrez vos clés Vertex AI",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B supporte 16K Tokens, offrant une capacité de génération de langage efficace et fluide."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything, le dernier modèle de fine-tuning open source, avec 34 milliards de paramètres, prend en charge divers scénarios de dialogue, avec des données d'entraînement de haute qualité, alignées sur les préférences humaines."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything, le dernier modèle de fine-tuning open source, avec 9 milliards de paramètres, prend en charge divers scénarios de dialogue, avec des données d'entraînement de haute qualité, alignées sur les préférences humaines."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, en tant que membre important de la série de modèles AI de 360, répond à des applications variées de traitement de texte avec une efficacité élevée, supportant la compréhension de longs textes et les dialogues multi-tours."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview est un modèle de recherche développé par l'équipe Qwen, axé sur les capacités de raisonnement visuel, qui possède des avantages uniques dans la compréhension de scènes complexes et la résolution de problèmes mathématiques liés à la vision."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ est le modèle d'inférence de la série Qwen. Comparé aux modèles d'optimisation d'instructions traditionnels, QwQ possède des capacités de réflexion et de raisonnement, permettant d'obtenir des performances nettement améliorées dans les tâches en aval, en particulier pour résoudre des problèmes difficiles. QwQ-32B est un modèle d'inférence de taille moyenne, capable d'obtenir des performances compétitives par rapport aux modèles d'inférence les plus avancés (comme DeepSeek-R1, o1-mini). Ce modèle utilise des techniques telles que RoPE, SwiGLU, RMSNorm et Attention QKV bias, avec une architecture de réseau de 64 couches et 40 têtes d'attention Q (dans l'architecture GQA, KV est de 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview est le dernier modèle de recherche expérimental de Qwen, axé sur l'amélioration des capacités de raisonnement de l'IA. En explorant des mécanismes complexes tels que le mélange de langues et le raisonnement récursif, ses principaux avantages incluent de puissantes capacités d'analyse de raisonnement, ainsi que des compétences en mathématiques et en programmation. Cependant, il existe également des problèmes de changement de langue, des cycles de raisonnement, des considérations de sécurité et des différences dans d'autres capacités."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet a élevé les normes de l'industrie, surpassant les modèles concurrents et Claude 3 Opus, tout en affichant d'excellentes performances dans une large gamme d'évaluations, tout en conservant la vitesse et le coût de nos modèles de niveau intermédiaire."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet élève les normes de l'industrie, surpassant les modèles concurrents et Claude 3 Opus, avec d'excellentes performances dans une large gamme d'évaluations, tout en offrant la vitesse et le coût de nos modèles de niveau intermédiaire."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku est le modèle le plus rapide et le plus compact d'Anthropic, offrant une vitesse de réponse quasi instantanée. Il peut répondre rapidement à des requêtes et demandes simples. Les clients pourront construire une expérience AI transparente imitant l'interaction humaine. Claude 3 Haiku peut traiter des images et retourner des sorties textuelles, avec une fenêtre contextuelle de 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 est un modèle multilingue lancé par Cohere, prenant en charge 23 langues, facilitant les applications linguistiques diversifiées."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B est un modèle de langage open source et commercialisable développé par Baichuan Intelligence, contenant 13 milliards de paramètres, qui a obtenu les meilleurs résultats dans des benchmarks chinois et anglais de référence."
+  },
  "charglm-3": {
    "description": "CharGLM-3 est conçu pour le jeu de rôle et l'accompagnement émotionnel, prenant en charge une mémoire multi-tours ultra-longue et des dialogues personnalisés, avec des applications variées."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 améliore considérablement les capacités de raisonnement du modèle avec très peu de données annotées. Avant de fournir la réponse finale, le modèle génère d'abord une chaîne de pensée pour améliorer l'exactitude de la réponse finale."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B est un modèle de langage de grande taille basé sur Llama3.3 70B, qui utilise le fine-tuning des sorties de DeepSeek R1 pour atteindre des performances compétitives comparables aux grands modèles de pointe."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B est un modèle de langage distillé basé sur Llama-3.1-8B-Instruct, entraîné en utilisant les sorties de DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B est un modèle de langage distillé basé sur Qwen 2.5 14B, entraîné en utilisant les sorties de DeepSeek R1. Ce modèle a surpassé l'o1-mini d'OpenAI dans plusieurs benchmarks, atteignant des résultats de pointe pour les modèles denses. Voici quelques résultats de benchmarks :\nAIME 2024 pass@1 : 69.7\nMATH-500 pass@1 : 93.9\nCodeForces Rating : 1481\nCe modèle, affiné à partir des sorties de DeepSeek R1, démontre des performances compétitives comparables à celles de modèles de pointe de plus grande taille."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B est un modèle de langage distillé basé sur Qwen 2.5 32B, entraîné en utilisant les sorties de DeepSeek R1. Ce modèle a surpassé l'o1-mini d'OpenAI dans plusieurs benchmarks, atteignant des résultats de pointe pour les modèles denses. Voici quelques résultats de benchmarks :\nAIME 2024 pass@1 : 72.6\nMATH-500 pass@1 : 94.3\nCodeForces Rating : 1691\nCe modèle, affiné à partir des sorties de DeepSeek R1, démontre des performances compétitives comparables à celles de modèles de pointe de plus grande taille."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 est le dernier modèle open source publié par l'équipe DeepSeek, offrant des performances d'inférence très puissantes, atteignant des niveaux comparables à ceux du modèle o1 d'OpenAI, en particulier dans les tâches de mathématiques, de programmation et de raisonnement."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 améliore considérablement les capacités de raisonnement du modèle avec très peu de données annotées. Avant de fournir la réponse finale, le modèle génère d'abord une chaîne de pensée pour améliorer l'exactitude de la réponse finale."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 a réalisé une percée majeure en termes de vitesse d'inférence par rapport aux modèles précédents. Il se classe au premier rang des modèles open source et peut rivaliser avec les modèles fermés les plus avancés au monde. DeepSeek-V3 utilise une architecture d'attention multi-tête (MLA) et DeepSeekMoE, qui ont été entièrement validées dans DeepSeek-V2. De plus, DeepSeek-V3 a introduit une stratégie auxiliaire sans perte pour l'équilibrage de charge et a établi des objectifs d'entraînement de prédiction multi-étiquettes pour obtenir de meilleures performances."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 a réalisé une percée majeure en termes de vitesse d'inférence par rapport aux modèles précédents. Il se classe au premier rang des modèles open source et peut rivaliser avec les modèles fermés les plus avancés au monde. DeepSeek-V3 utilise une architecture d'attention multi-tête (MLA) et DeepSeekMoE, qui ont été entièrement validées dans DeepSeek-V2. De plus, DeepSeek-V3 a introduit une stratégie auxiliaire sans perte pour l'équilibrage de charge et a établi des objectifs d'entraînement de prédiction multi-étiquettes pour obtenir de meilleures performances."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite est un modèle léger de nouvelle génération, offrant une vitesse de réponse extrême, avec des performances et des délais atteignant des niveaux de classe mondiale."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash propose des fonctionnalités et des améliorations de nouvelle génération, y compris une vitesse exceptionnelle, l'utilisation d'outils natifs, la génération multimodale et une fenêtre de contexte de 1M tokens."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Une variante du modèle Gemini 2.0 Flash, optimisée pour des objectifs tels que le rapport coût-efficacité et la faible latence."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Une variante du modèle Gemini 2.0 Flash, optimisée pour des objectifs tels que le rapport coût-efficacité et la faible latence."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Un modèle Gemini 2.0 Flash optimisé pour des objectifs de rentabilité et de faible latence."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp est le dernier modèle d'IA multimodal expérimental de Google, doté de caractéristiques de nouvelle génération, d'une vitesse exceptionnelle, d'appels d'outils natifs et de génération multimodale."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp est le dernier modèle d'IA multimodal expérimental de Google, doté de caractéristiques de nouvelle génération, d'une vitesse exceptionnelle, d'appels d'outils natifs et de génération multimodale."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "Le dernier modèle GPT-4 Turbo dispose de fonctionnalités visuelles. Désormais, les requêtes visuelles peuvent être effectuées en utilisant le mode JSON et les appels de fonction. GPT-4 Turbo est une version améliorée, offrant un soutien rentable pour les tâches multimodales. Il trouve un équilibre entre précision et efficacité, adapté aux applications nécessitant des interactions en temps réel."
  },
+  "gpt-4.5-preview": {
+    "description": "La version de recherche préliminaire de GPT-4.5, qui est notre modèle GPT le plus grand et le plus puissant à ce jour. Il possède une vaste connaissance du monde et comprend mieux les intentions des utilisateurs, ce qui le rend exceptionnel dans les tâches créatives et la planification autonome. GPT-4.5 accepte les entrées textuelles et visuelles et génère des sorties textuelles (y compris des sorties structurées). Il prend en charge des fonctionnalités clés pour les développeurs, telles que les appels de fonctions, l'API par lots et les sorties en continu. GPT-4.5 excelle particulièrement dans les tâches nécessitant créativité, pensée ouverte et dialogue (comme l'écriture, l'apprentissage ou l'exploration de nouvelles idées). La date limite des connaissances est fixée à octobre 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o est un modèle dynamique, mis à jour en temps réel pour rester à jour avec la dernière version. Il combine une compréhension et une génération de langage puissantes, adapté à des scénarios d'application à grande échelle, y compris le service client, l'éducation et le support technique."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B est un modèle à haute performance, offrant une capacité de génération de texte rapide, particulièrement adapté aux scénarios d'application nécessitant une efficacité à grande échelle et un rapport coût-efficacité."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Le modèle Llama 3.1 Sonar Huge Online, avec 405B de paramètres, prend en charge une longueur de contexte d'environ 127 000 jetons, conçu pour des applications de chat en ligne complexes."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Le modèle Llama 3.1 Sonar Large Online, avec 70B de paramètres, prend en charge une longueur de contexte d'environ 127 000 jetons, adapté aux tâches de chat à haute capacité et diversifiées."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Le modèle Llama 3.1 Sonar Small Online, avec 8B de paramètres, prend en charge une longueur de contexte d'environ 127 000 jetons, conçu pour le chat en ligne, capable de traiter efficacement diverses interactions textuelles."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Capacités d'inférence d'image exceptionnelles sur des images haute résolution, adaptées aux applications de compréhension visuelle."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 est conçu pour traiter des tâches combinant des données visuelles et textuelles. Il excelle dans des tâches telles que la description d'images et les questions-réponses visuelles, comblant le fossé entre la génération de langage et le raisonnement visuel."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 est conçu pour traiter des tâches combinant des données visuelles et textuelles. Il excelle dans des tâches telles que la description d'images et les questions-réponses visuelles, comblant le fossé entre la génération de langage et le raisonnement visuel."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Le modèle de langage à grande échelle Tongyi Qwen de niveau milliard, prenant en charge des entrées en chinois, en anglais et dans d'autres langues, actuellement le modèle API derrière la version produit Tongyi Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "La série de modèles Qwen-Omni prend en charge l'entrée de données multimodales, y compris vidéo, audio, images et texte, et produit des sorties audio et textuelles."
+  },
  "qwen-plus": {
    "description": "Version améliorée du modèle de langage à grande échelle Qwen, prenant en charge des entrées dans différentes langues telles que le chinois et l'anglais."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Initialisé avec le modèle de langage Qwen-7B, ajoutant un modèle d'image, un modèle pré-entraîné avec une résolution d'entrée d'image de 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 est la toute nouvelle série de modèles de langage de grande taille Qwen. Qwen2 7B est un modèle basé sur le transformateur, qui excelle dans la compréhension du langage, les capacités multilingues, la programmation, les mathématiques et le raisonnement."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 est une toute nouvelle série de modèles de langage de grande taille, offrant des capacités de compréhension et de génération plus puissantes."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL est la dernière version itérée du modèle Qwen-VL, atteignant des performances de pointe dans les benchmarks de compréhension visuelle, y compris MathVista, DocVQA, RealWorldQA et MTVQA. Qwen2-VL peut comprendre des vidéos de plus de 20 minutes pour des questions-réponses, des dialogues et de la création de contenu de haute qualité basés sur la vidéo. Il possède également des capacités de raisonnement et de décision complexes, pouvant être intégré à des appareils mobiles, des robots, etc., pour des opérations automatiques basées sur l'environnement visuel et des instructions textuelles. En plus de l'anglais et du chinois, Qwen2-VL prend désormais en charge la compréhension du texte dans différentes langues dans les images, y compris la plupart des langues européennes, le japonais, le coréen, l'arabe et le vietnamien."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct est l'un des derniers modèles de langage de grande taille publiés par Alibaba Cloud. Ce modèle de 72B présente des capacités significativement améliorées dans des domaines tels que le codage et les mathématiques. Le modèle offre également un support multilingue, couvrant plus de 29 langues, y compris le chinois et l'anglais. Il a montré des améliorations significatives dans le suivi des instructions, la compréhension des données structurées et la génération de sorties structurées (en particulier JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct est l'un des derniers modèles de langage de grande taille publiés par Alibaba Cloud. Ce modèle de 32B présente des capacités significativement améliorées dans des domaines tels que le codage et les mathématiques. Le modèle offre un support multilingue, couvrant plus de 29 langues, y compris le chinois et l'anglais. Il a montré des améliorations significatives dans le suivi des instructions, la compréhension des données structurées et la génération de sorties structurées (en particulier JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM orienté vers le chinois et l'anglais, ciblant des domaines tels que la langue, la programmation, les mathématiques et le raisonnement."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ est un modèle de recherche expérimental, axé sur l'amélioration des capacités de raisonnement de l'IA."
  },
+  "qwq-32b": {
+    "description": "Le modèle d'inférence QwQ, entraîné sur le modèle Qwen2.5-32B, a considérablement amélioré ses capacités d'inférence grâce à l'apprentissage par renforcement. Les indicateurs clés du modèle, tels que le code mathématique (AIME 24/25, LiveCodeBench) ainsi que certains indicateurs généraux (IFEval, LiveBench, etc.), atteignent le niveau de la version complète de DeepSeek-R1, avec des performances nettement supérieures à celles de DeepSeek-R1-Distill-Qwen-32B, également basé sur Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "Le modèle QwQ est un modèle de recherche expérimental développé par l'équipe Qwen, axé sur l'amélioration des capacités de raisonnement de l'IA."
  },
+  "qwq-plus-latest": {
+    "description": "Le modèle d'inférence QwQ, entraîné sur le modèle Qwen2.5, a considérablement amélioré ses capacités d'inférence grâce à l'apprentissage par renforcement. Les indicateurs clés du modèle, tels que le code mathématique (AIME 24/25, LiveCodeBench) ainsi que certains indicateurs généraux (IFEval, LiveBench, etc.), atteignent le niveau de la version complète de DeepSeek-R1."
+  },
+  "r1-1776": {
+    "description": "R1-1776 est une version du modèle DeepSeek R1, après un entraînement supplémentaire, fournissant des informations factuelles non filtrées et impartiales."
+  },
  "solar-mini": {
    "description": "Solar Mini est un LLM compact, offrant des performances supérieures à celles de GPT-3.5, avec de puissantes capacités multilingues, prenant en charge l'anglais et le coréen, et fournissant une solution efficace et compacte."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Produit de recherche léger basé sur le contexte de recherche, plus rapide et moins cher que Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research effectue des recherches approfondies de niveau expert et les synthétise en rapports accessibles et exploitables."
+  },
  "sonar-pro": {
    "description": "Produit de recherche avancé prenant en charge le contexte de recherche, avec des requêtes avancées et un suivi."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Un modèle d'Embedding de nouvelle génération, efficace et économique, adapté à la recherche de connaissances, aux applications RAG, etc."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "Version open source de la dernière génération de modèles pré-entraînés de la série GLM-4 publiée par Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) offre une capacité de calcul améliorée grâce à des stratégies et une architecture de modèle efficaces."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet élève les normes de l'industrie, surpassant les modèles concurrents et Claude 3 Opus, avec d'excellentes performances dans une large gamme d'évaluations, tout en offrant la vitesse et le coût de nos modèles de niveau intermédiaire."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonnet est le modèle de prochaine génération le plus rapide d'Anthropic. Par rapport à Claude 3 Haiku, Claude 3.7 Sonnet a amélioré ses compétences dans divers domaines et a surpassé le plus grand modèle de la génération précédente, Claude 3 Opus, dans de nombreux tests de référence intellectuels."
+  },
  "whisper-1": {
    "description": "Modèle de reconnaissance vocale général, prenant en charge la reconnaissance vocale multilingue, la traduction vocale et la reconnaissance de langue."
  },
@@ -140,6 +140,18 @@
      "close": "Supprimer",
      "confirm": "Configuration terminée, veuillez réessayer"
    },
+    "crawPages": {
+      "crawling": "Identification des liens en cours",
+      "detail": {
+        "preview": "Aperçu",
+        "raw": "Texte brut",
+        "tooLong": "Le contenu du texte est trop long, le contexte de la conversation ne conserve que les {{characters}} premiers caractères, la partie excédentaire n'est pas prise en compte dans le contexte de la conversation"
+      },
+      "meta": {
+        "crawler": "Mode de collecte",
+        "words": "Nombre de caractères"
+      }
+    },
    "searchxng": {
      "baseURL": "Veuillez entrer",
      "description": "Veuillez entrer l'URL de SearchXNG pour commencer la recherche en ligne",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity est un fournisseur de modèles de génération de dialogue de premier plan, offrant divers modèles avancés Llama 3.1, prenant en charge les applications en ligne et hors ligne, particulièrement adaptés aux tâches complexes de traitement du langage naturel."
  },
+  "ppio": {
+    "description": "PPIO Paiouyun offre des services API de modèles open source stables et rentables, prenant en charge toute la gamme DeepSeek, Llama, Qwen et d'autres grands modèles de pointe dans l'industrie."
+  },
  "qwen": {
    "description": "Tongyi Qianwen est un modèle de langage à grande échelle développé de manière autonome par Alibaba Cloud, doté de puissantes capacités de compréhension et de génération du langage naturel. Il peut répondre à diverses questions, créer du contenu écrit, exprimer des opinions, rédiger du code, etc., jouant un rôle dans plusieurs domaines."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Copia",
  "emptyAgent": "Nessun assistente disponibile",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "Il costo di generazione di una singola conversazione può essere ridotto fino al 90%, con una velocità di risposta aumentata di 4 volte (<1>Scopri di più</1>). Attivando questa opzione, verrà disabilitato automaticamente il limite sul numero di messaggi storici.",
+      "title": "Attiva la cache del contesto"
+    },
    "enableReasoning": {
+      "desc": "Limitazioni basate sul meccanismo di pensiero di Claude (<1>Scopri di più</1>), attivando questa opzione verrà disabilitato automaticamente il limite sul numero di messaggi storici.",
      "title": "Attiva il pensiero profondo"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Funzionalità di estensione del modello"
  },
+  "history": {
+    "title": "L'assistente ricorderà solo gli ultimi {{count}} messaggi"
+  },
  "historyRange": "Intervallo cronologico",
  "historySummary": "Riepilogo della storia",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Esistono sottoargomenti, non è possibile eliminare",
    "regenerate": "Rigenera"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Crediti",
+      "creditPricing": "Prezzo",
+      "creditTooltip": "Per facilitare il conteggio, consideriamo 1$ equivalente a 1M crediti, ad esempio $3/M token equivalgono a 3 crediti/token",
+      "pricing": {
+        "inputCachedTokens": "Input memorizzato {{amount}}/crediti · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M caratteri",
+        "inputMinutes": "${{amount}}/minuto",
+        "inputTokens": "Input {{amount}}/crediti · ${{amount}}/M",
+        "outputTokens": "Output {{amount}}/crediti · ${{amount}}/M",
+        "writeCacheInputTokens": "Scrittura cache input {{amount}}/crediti · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Prezzo medio",
+      "input": "Input",
+      "inputAudio": "Input audio",
+      "inputCached": "Input memorizzato",
+      "inputCitation": "Citazione input",
+      "inputText": "Input testo",
+      "inputTitle": "Dettagli input",
+      "inputUncached": "Input non memorizzato",
+      "inputWriteCached": "Scrittura cache input",
+      "output": "Output",
+      "outputAudio": "Output audio",
+      "outputText": "Output testo",
+      "outputTitle": "Dettagli output",
+      "reasoning": "Ragionamento profondo",
+      "title": "Dettagli generati",
+      "total": "Totale consumato"
+    }
+  },
  "newAgent": "Nuovo assistente",
  "pin": "Fissa in alto",
  "pinOff": "Annulla fissaggio in alto",
@@ -322,6 +322,9 @@
    "tooltip": "Aggiorna la configurazione di base del fornitore",
    "updateSuccess": "Aggiornamento avvenuto con successo"
  },
+  "updateCustomAiProvider": {
+    "title": "Aggiorna la configurazione del fornitore di AI personalizzato"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Inserisci le tue chiavi Vertex AI",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B supporta 16K Tokens, offrendo capacità di generazione linguistica efficienti e fluide."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything, il più recente modello open source fine-tuned, con 34 miliardi di parametri, supporta vari scenari di dialogo, con dati di addestramento di alta qualità, allineati alle preferenze umane."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything, il più recente modello open source fine-tuned, con 9 miliardi di parametri, supporta vari scenari di dialogo, con dati di addestramento di alta qualità, allineati alle preferenze umane."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, come membro importante della serie di modelli AI di 360, soddisfa le diverse applicazioni del linguaggio naturale con un'efficace capacità di elaborazione del testo, supportando la comprensione di testi lunghi e conversazioni a più turni."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview è un modello di ricerca sviluppato dal team Qwen, focalizzato sulle capacità di inferenza visiva, con vantaggi unici nella comprensione di scenari complessi e nella risoluzione di problemi matematici legati alla visione."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ è il modello di inferenza della serie Qwen. Rispetto ai tradizionali modelli di ottimizzazione delle istruzioni, QwQ possiede capacità di pensiero e ragionamento, consentendo prestazioni significativamente migliorate nei compiti downstream, specialmente nella risoluzione di problemi complessi. QwQ-32B è un modello di inferenza di medie dimensioni, in grado di ottenere prestazioni competitive rispetto ai modelli di inferenza all'avanguardia (come DeepSeek-R1, o1-mini). Questo modello utilizza tecnologie come RoPE, SwiGLU, RMSNorm e Attention QKV bias, con una struttura di rete a 64 strati e 40 teste di attenzione Q (nel GQA, KV è 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview è l'ultimo modello di ricerca sperimentale di Qwen, focalizzato sul miglioramento delle capacità di ragionamento dell'IA. Esplorando meccanismi complessi come la mescolanza linguistica e il ragionamento ricorsivo, i principali vantaggi includono potenti capacità di analisi del ragionamento, abilità matematiche e di programmazione. Tuttavia, ci sono anche problemi di cambio linguistico, cicli di ragionamento, considerazioni di sicurezza e differenze in altre capacità."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet ha elevato gli standard del settore, superando le prestazioni dei modelli concorrenti e di Claude 3 Opus, dimostrando eccellenza in una vasta gamma di valutazioni, mantenendo al contempo la velocità e i costi dei nostri modelli di livello medio."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet è il modello più recente di Anthropic, con prestazioni all'avanguardia in una vasta gamma di valutazioni, superando i modelli concorrenti e Claude 3.5 Sonnet, dimostrando eccellenza in una vasta gamma di valutazioni, mantenendo al contempo la velocità e i costi dei nostri modelli di livello medio."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku è il modello più veloce e compatto di Anthropic, offrendo una velocità di risposta quasi istantanea. Può rispondere rapidamente a query e richieste semplici. I clienti saranno in grado di costruire un'esperienza AI senza soluzione di continuità che imita l'interazione umana. Claude 3 Haiku può gestire immagini e restituire output testuali, con una finestra di contesto di 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 è un modello multilingue lanciato da Cohere, supporta 23 lingue, facilitando applicazioni linguistiche diversificate."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B è un modello di linguaggio open source sviluppato da Baichuan Intelligence, con 13 miliardi di parametri, che ha ottenuto i migliori risultati nella sua categoria in benchmark autorevoli sia in cinese che in inglese."
+  },
  "charglm-3": {
    "description": "CharGLM-3 è progettato per il gioco di ruolo e la compagnia emotiva, supporta una memoria multi-turno ultra-lunga e dialoghi personalizzati, con ampie applicazioni."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 ha notevolmente migliorato le capacità di ragionamento del modello con pochissimi dati etichettati. Prima di fornire la risposta finale, il modello genera una catena di pensiero per migliorare l'accuratezza della risposta finale."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B è un grande modello di linguaggio basato su Llama3.3 70B, che utilizza il fine-tuning dell'output di DeepSeek R1 per raggiungere prestazioni competitive paragonabili a quelle dei modelli all'avanguardia di grandi dimensioni."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B è un modello di linguaggio distillato basato su Llama-3.1-8B-Instruct, addestrato utilizzando l'output di DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B è un modello di linguaggio distillato basato su Qwen 2.5 14B, addestrato utilizzando l'output di DeepSeek R1. Questo modello ha superato OpenAI's o1-mini in diversi benchmark, raggiungendo risultati all'avanguardia per i modelli densi. Ecco alcuni risultati dei benchmark:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nQuesto modello, attraverso il fine-tuning dell'output di DeepSeek R1, ha dimostrato prestazioni competitive paragonabili a modelli all'avanguardia di dimensioni maggiori."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B è un modello di linguaggio distillato basato su Qwen 2.5 32B, addestrato utilizzando l'output di DeepSeek R1. Questo modello ha superato OpenAI's o1-mini in diversi benchmark, raggiungendo risultati all'avanguardia per i modelli densi. Ecco alcuni risultati dei benchmark:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nQuesto modello, attraverso il fine-tuning dell'output di DeepSeek R1, ha dimostrato prestazioni competitive paragonabili a modelli all'avanguardia di dimensioni maggiori."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 è l'ultimo modello open source rilasciato dal team di DeepSeek, con prestazioni di inferenza eccezionali, in particolare nei compiti di matematica, programmazione e ragionamento, raggiungendo livelli comparabili a quelli del modello o1 di OpenAI."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 ha notevolmente migliorato le capacità di ragionamento del modello con pochissimi dati etichettati. Prima di fornire la risposta finale, il modello genera una catena di pensiero per migliorare l'accuratezza della risposta finale."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 ha realizzato un significativo progresso nella velocità di inferenza rispetto ai modelli precedenti. Si posiziona al primo posto tra i modelli open source e può competere con i modelli closed source più avanzati al mondo. DeepSeek-V3 utilizza l'architettura Multi-Head Latent Attention (MLA) e DeepSeekMoE, che sono state ampiamente validate in DeepSeek-V2. Inoltre, DeepSeek-V3 ha introdotto una strategia ausiliaria senza perdita per il bilanciamento del carico e ha stabilito obiettivi di addestramento per la previsione multi-etichetta per ottenere prestazioni superiori."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 ha realizzato un significativo progresso nella velocità di inferenza rispetto ai modelli precedenti. Si posiziona al primo posto tra i modelli open source e può competere con i modelli closed source più avanzati al mondo. DeepSeek-V3 utilizza l'architettura Multi-Head Latent Attention (MLA) e DeepSeekMoE, che sono state ampiamente validate in DeepSeek-V2. Inoltre, DeepSeek-V3 ha introdotto una strategia ausiliaria senza perdita per il bilanciamento del carico e ha stabilito obiettivi di addestramento per la previsione multi-etichetta per ottenere prestazioni superiori."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite è un modello leggero di nuova generazione, con una velocità di risposta eccezionale, raggiungendo standard di livello mondiale sia in termini di prestazioni che di latenza."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash offre funzionalità e miglioramenti di nuova generazione, tra cui velocità eccezionale, utilizzo di strumenti nativi, generazione multimodale e una finestra di contesto di 1M token."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash è una variante del modello Flash, ottimizzata per obiettivi come il rapporto costo-efficacia e la bassa latenza."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash è una variante del modello Flash, ottimizzata per obiettivi come il rapporto costo-efficacia e la bassa latenza."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Un modello Gemini 2.0 Flash ottimizzato per obiettivi di costo-efficacia e bassa latenza."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp è il più recente modello AI multimodale sperimentale di Google, dotato di caratteristiche di nuova generazione, velocità eccezionale, chiamate a strumenti nativi e generazione multimodale."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp è il più recente modello AI multimodale sperimentale di Google, dotato di caratteristiche di nuova generazione, velocità eccezionale, chiamate a strumenti nativi e generazione multimodale."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "L'ultimo modello GPT-4 Turbo ha funzionalità visive. Ora, le richieste visive possono essere effettuate utilizzando il formato JSON e le chiamate di funzione. GPT-4 Turbo è una versione potenziata che offre supporto economico per compiti multimodali. Trova un equilibrio tra accuratezza ed efficienza, adatta a scenari di applicazione che richiedono interazioni in tempo reale."
  },
+  "gpt-4.5-preview": {
+    "description": "Anteprima di ricerca di GPT-4.5, il nostro modello GPT più grande e potente fino ad oggi. Possiede una vasta conoscenza del mondo e comprende meglio le intenzioni degli utenti, eccellendo in compiti creativi e nella pianificazione autonoma. GPT-4.5 accetta input testuali e visivi e genera output testuali (inclusi output strutturati). Supporta funzionalità chiave per gli sviluppatori, come chiamate di funzione, API in batch e output in streaming. GPT-4.5 si distingue particolarmente in compiti che richiedono pensiero creativo, aperto e dialogo (come scrittura, apprendimento o esplorazione di nuove idee). La data di scadenza delle conoscenze è ottobre 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o è un modello dinamico, aggiornato in tempo reale per mantenere la versione più recente. Combina una potente comprensione e generazione del linguaggio, adatta a scenari di applicazione su larga scala, inclusi servizi clienti, educazione e supporto tecnico."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B è un modello ad alte prestazioni, offre capacità di generazione di testo rapida, particolarmente adatto per scenari applicativi che richiedono efficienza su larga scala e costi contenuti."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Il modello Llama 3.1 Sonar Huge Online, con 405B parametri, supporta una lunghezza di contesto di circa 127.000 token, progettato per applicazioni di chat online complesse."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Il modello Llama 3.1 Sonar Large Online, con 70B parametri, supporta una lunghezza di contesto di circa 127.000 token, adatto per compiti di chat ad alta capacità e diversificati."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Il modello Llama 3.1 Sonar Small Online, con 8B parametri, supporta una lunghezza di contesto di circa 127.000 token, progettato per chat online, in grado di gestire interazioni testuali in modo efficiente."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Eccellenti capacità di ragionamento visivo su immagini ad alta risoluzione, adatte ad applicazioni di comprensione visiva."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 è progettato per gestire compiti che combinano dati visivi e testuali. Si distingue in compiti come la descrizione delle immagini e il question answering visivo, colmando il divario tra generazione del linguaggio e ragionamento visivo."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 è progettato per gestire compiti che combinano dati visivi e testuali. Si distingue in compiti come la descrizione delle immagini e il question answering visivo, colmando il divario tra generazione del linguaggio e ragionamento visivo."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Modello linguistico su larga scala Tongyi Qwen con miliardi di parametri, supporta input in diverse lingue tra cui cinese e inglese, attualmente il modello API dietro la versione del prodotto Tongyi Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "La serie di modelli Qwen-Omni supporta l'input di dati in diverse modalità, inclusi video, audio, immagini e testo, e produce output audio e testuale."
+  },
  "qwen-plus": {
    "description": "Qwen Plus è una versione potenziata del modello linguistico di grandi dimensioni, che supporta input in diverse lingue, tra cui cinese e inglese."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Inizializzato con il modello di linguaggio Qwen-7B, aggiunge un modello di immagine, con una risoluzione di input dell'immagine di 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 è la nuova serie di modelli di linguaggio Qwen. Qwen2 7B è un modello basato su transformer, che mostra prestazioni eccezionali nella comprensione del linguaggio, nelle capacità multilingue, nella programmazione, nella matematica e nel ragionamento."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 è una nuova serie di modelli di linguaggio di grandi dimensioni, con capacità di comprensione e generazione più forti."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL è l'ultima iterazione del modello Qwen-VL, raggiungendo prestazioni all'avanguardia nei benchmark di comprensione visiva, inclusi MathVista, DocVQA, RealWorldQA e MTVQA. Qwen2-VL è in grado di comprendere video di oltre 20 minuti, per domande e risposte, dialoghi e creazione di contenuti di alta qualità basati su video. Ha anche capacità di ragionamento e decisione complesse, che possono essere integrate con dispositivi mobili, robot e altro, per operazioni automatiche basate su ambienti visivi e istruzioni testuali. Oltre all'inglese e al cinese, Qwen2-VL ora supporta anche la comprensione di testi in diverse lingue all'interno delle immagini, comprese la maggior parte delle lingue europee, giapponese, coreano, arabo e vietnamita."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct è uno dei più recenti modelli di linguaggio rilasciati da Alibaba Cloud. Questo modello da 72B ha capacità notevolmente migliorate in campi come la codifica e la matematica. Il modello offre anche supporto multilingue, coprendo oltre 29 lingue, tra cui cinese e inglese. Ha mostrato miglioramenti significativi nel seguire istruzioni, comprendere dati strutturati e generare output strutturati (in particolare JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct è uno dei più recenti modelli di linguaggio rilasciati da Alibaba Cloud. Questo modello da 32B ha capacità notevolmente migliorate in campi come la codifica e la matematica. Il modello offre anche supporto multilingue, coprendo oltre 29 lingue, tra cui cinese e inglese. Ha mostrato miglioramenti significativi nel seguire istruzioni, comprendere dati strutturati e generare output strutturati (in particolare JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM orientato al cinese e all'inglese, focalizzato su linguaggio, programmazione, matematica, ragionamento e altro."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ è un modello di ricerca sperimentale, focalizzato sul miglioramento delle capacità di ragionamento dell'IA."
  },
+  "qwq-32b": {
+    "description": "Il modello di inferenza QwQ, addestrato sul modello Qwen2.5-32B, ha notevolmente migliorato le capacità di inferenza del modello attraverso l'apprendimento rinforzato. I principali indicatori core (AIME 24/25, LiveCodeBench) e alcuni indicatori generali (IFEval, LiveBench, ecc.) raggiungono il livello della versione completa di DeepSeek-R1, con tutti gli indicatori che superano significativamente il DeepSeek-R1-Distill-Qwen-32B, anch'esso basato su Qwen2.5-32B."
+  },
  "qwq-32b-preview": {
    "description": "Il modello QwQ è un modello di ricerca sperimentale sviluppato dal team Qwen, focalizzato sul potenziamento delle capacità di ragionamento dell'IA."
  },
+  "qwq-plus-latest": {
+    "description": "Il modello di inferenza QwQ, addestrato sul modello Qwen2.5, ha notevolmente migliorato le capacità di inferenza del modello attraverso l'apprendimento rinforzato. I principali indicatori core (AIME 24/25, LiveCodeBench) e alcuni indicatori generali (IFEval, LiveBench, ecc.) raggiungono il livello della versione completa di DeepSeek-R1."
+  },
+  "r1-1776": {
+    "description": "R1-1776 è una versione del modello DeepSeek R1, addestrata successivamente per fornire informazioni fattuali non verificate e prive di pregiudizi."
+  },
  "solar-mini": {
    "description": "Solar Mini è un LLM compatto, con prestazioni superiori a GPT-3.5, dotato di potenti capacità multilingue, supporta inglese e coreano, offrendo soluzioni efficienti e compatte."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Prodotto di ricerca leggero basato sul contesto di ricerca, più veloce e più economico rispetto a Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research conduce ricerche complete a livello esperto e le sintetizza in rapporti accessibili e utilizzabili."
+  },
  "sonar-pro": {
    "description": "Prodotto di ricerca avanzata che supporta il contesto di ricerca, query avanzate e follow-up."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Modello di Embedding di nuova generazione, efficiente ed economico, adatto per la ricerca di conoscenza, applicazioni RAG e altri scenari."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "La versione open source dell'ultima generazione del modello pre-addestrato GLM-4 rilasciato da Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) offre capacità di calcolo potenziate attraverso strategie e architetture di modelli efficienti."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet ha elevato gli standard del settore, superando le prestazioni dei modelli concorrenti e di Claude 3 Opus, dimostrando eccellenza in una vasta gamma di valutazioni, mantenendo al contempo la velocità e i costi dei nostri modelli di livello medio."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonnet è il modello di prossima generazione più veloce di Anthropic. Rispetto a Claude 3 Haiku, Claude 3.7 Sonnet ha migliorato le sue capacità in vari ambiti e ha superato il modello di generazione precedente, Claude 3 Opus, in molti test di intelligenza."
+  },
  "whisper-1": {
    "description": "Modello di riconoscimento vocale universale, supporta il riconoscimento vocale multilingue, la traduzione vocale e il riconoscimento linguistico."
  },
@@ -140,6 +140,18 @@
      "close": "Rimuovi",
      "confirm": "Configurazione completata, riprovare"
    },
+    "crawPages": {
+      "crawling": "Riconoscimento del link in corso",
+      "detail": {
+        "preview": "Anteprima",
+        "raw": "Testo originale",
+        "tooLong": "Il contenuto del testo è troppo lungo, il contesto della conversazione manterrà solo i primi {{characters}} caratteri, la parte in eccesso non verrà considerata nel contesto della conversazione"
+      },
+      "meta": {
+        "crawler": "Modalità di scansione",
+        "words": "Numero di caratteri"
+      }
+    },
    "searchxng": {
      "baseURL": "Inserisci",
      "description": "Inserisci l'URL di SearchXNG per iniziare la ricerca online",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity è un fornitore leader di modelli di generazione di dialogo, offrendo vari modelli avanzati Llama 3.1, supportando applicazioni online e offline, particolarmente adatti per compiti complessi di elaborazione del linguaggio naturale."
  },
+  "ppio": {
+    "description": "PPIO Paeou Cloud offre servizi API per modelli open source stabili e ad alto rapporto qualità-prezzo, supportando l'intera gamma di DeepSeek, Llama, Qwen e altri modelli di grandi dimensioni leader del settore."
+  },
  "qwen": {
    "description": "Qwen è un modello di linguaggio di grande scala sviluppato autonomamente da Alibaba Cloud, con potenti capacità di comprensione e generazione del linguaggio naturale. Può rispondere a varie domande, creare contenuti testuali, esprimere opinioni e scrivere codice, svolgendo un ruolo in vari settori."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} のコピー",
  "emptyAgent": "エージェントがいません",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "単一の対話生成コストは最大90%削減され、応答速度は4倍向上します（<1>詳細はこちら</1>）。有効にすると、過去のメッセージ数制限が自動的に無効になります。",
+      "title": "コンテキストキャッシュを有効にする"
+    },
    "enableReasoning": {
+      "desc": "Claude Thinkingメカニズムに基づく制限（<1>詳細はこちら</1>）により、有効にすると過去のメッセージ数制限が自動的に無効になります。",
      "title": "深い思考を有効にする"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "モデル拡張機能"
  },
+  "history": {
+    "title": "アシスタントは最後の{{count}}件のメッセージのみを記憶します"
+  },
  "historyRange": "履歴範囲",
  "historySummary": "履歴メッセージの要約",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "サブトピックが存在するため、削除できません。",
    "regenerate": "再生成"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "クレジット",
+      "creditPricing": "価格設定",
+      "creditTooltip": "カウントを容易にするために、1ドルを1Mクレジットに換算します。例えば、$3/Mトークンは3クレジット/トークンに相当します。",
+      "pricing": {
+        "inputCachedTokens": "キャッシュ入力 {{amount}}/クレジット · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M 文字",
+        "inputMinutes": "${{amount}}/分",
+        "inputTokens": "入力 {{amount}}/クレジット · ${{amount}}/M",
+        "outputTokens": "出力 {{amount}}/クレジット · ${{amount}}/M",
+        "writeCacheInputTokens": "キャッシュ入力の書き込み {{amount}}/ポイント · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "平均単価",
+      "input": "入力",
+      "inputAudio": "音声入力",
+      "inputCached": "キャッシュ入力",
+      "inputCitation": "引用入力",
+      "inputText": "テキスト入力",
+      "inputTitle": "入力の詳細",
+      "inputUncached": "未キャッシュ入力",
+      "inputWriteCached": "入力キャッシュ書き込み",
+      "output": "出力",
+      "outputAudio": "音声出力",
+      "outputText": "テキスト出力",
+      "outputTitle": "出力の詳細",
+      "reasoning": "深い思考",
+      "title": "生成の詳細",
+      "total": "合計消費"
+    }
+  },
  "newAgent": "新しいエージェント",
  "pin": "ピン留め",
  "pinOff": "ピン留め解除",
@@ -322,6 +322,9 @@
    "tooltip": "サービスプロバイダーの基本設定を更新",
    "updateSuccess": "更新に成功しました"
  },
+  "updateCustomAiProvider": {
+    "title": "カスタム AI プロバイダー設定の更新"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "あなたの Vertex AI キーを入力してください",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9Bは16Kトークンをサポートし、高効率でスムーズな言語生成能力を提供します。"
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "零一万物、最新のオープンソース微調整モデル、340億パラメータ、微調整は多様な対話シーンをサポートし、高品質なトレーニングデータで人間の好みに合わせています。"
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "零一万物、最新のオープンソース微調整モデル、90億パラメータ、微調整は多様な対話シーンをサポートし、高品質なトレーニングデータで人間の好みに合わせています。"
+  },
  "360gpt-pro": {
    "description": "360GPT Proは360 AIモデルシリーズの重要なメンバーであり、高効率なテキスト処理能力を持ち、多様な自然言語アプリケーションシーンに対応し、長文理解や多輪対話などの機能をサポートします。"
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Previewは、Qwenチームによって開発された視覚推論能力に特化した研究モデルであり、複雑なシーン理解と視覚関連の数学問題を解決する上で独自の利点を持っています。"
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQはQwenシリーズの推論モデルです。従来の指示調整モデルと比較して、QwQは思考と推論能力を備えており、特に困難な問題を解決する際に、下流タスクでのパフォーマンスを大幅に向上させることができます。QwQ-32Bは中型の推論モデルであり、最先端の推論モデル（DeepSeek-R1、o1-miniなど）との比較において競争力のあるパフォーマンスを発揮します。このモデルはRoPE、SwiGLU、RMSNorm、Attention QKVバイアスなどの技術を採用しており、64層のネットワーク構造と40のQアテンションヘッド（GQAアーキテクチャではKVは8個）を持っています。"
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-PreviewはQwenの最新の実験的研究モデルで、AIの推論能力を向上させることに特化しています。言語の混合、再帰的推論などの複雑なメカニズムを探求することで、主な利点は強力な推論分析能力、数学およびプログラミング能力です。同時に、言語切り替えの問題、推論のループ、安全性の考慮、その他の能力の違いも存在します。"
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnetは業界標準を引き上げ、競合モデルやClaude 3 Opusを上回る性能を発揮し、広範な評価で優れた結果を示しています。また、中程度のレベルのモデルと同等の速度とコストを持っています。"
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnetは、競合他社よりも低価格で最大の効用を提供し、信頼性が高く耐久性のある主力機として設計されています。スケール化されたAIデプロイメントに適しています。Claude 3.7 Sonnetは画像を処理し、テキスト出力を返すことができ、200Kのコンテキストウィンドウを持っています。"
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 HaikuはAnthropicの最も速く、最もコンパクトなモデルで、ほぼ瞬時の応答速度を提供します。簡単なクエリやリクエストに迅速に回答できます。顧客は人間のインタラクションを模倣するシームレスなAI体験を構築できるようになります。Claude 3 Haikuは画像を処理し、テキスト出力を返すことができ、200Kのコンテキストウィンドウを持っています。"
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23は、Cohereが提供する多言語モデルであり、23の言語をサポートし、多様な言語アプリケーションを便利にします。"
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13Bは百川智能が開発した130億パラメータを持つオープンソースの商用大規模言語モデルで、権威ある中国語と英語のベンチマークで同サイズの中で最良の結果を達成しています。"
+  },
  "charglm-3": {
    "description": "CharGLM-3はキャラクター演技と感情的な伴侶のために設計されており、超長期の多段階記憶と個別化された対話をサポートし、幅広い用途に適しています。"
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1は、わずかなラベル付きデータしかない状況で、モデルの推論能力を大幅に向上させました。最終的な回答を出力する前に、モデルは思考の連鎖を出力し、最終的な答えの正確性を向上させます。"
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70BはLlama3.3 70Bに基づく大規模言語モデルで、DeepSeek R1の出力を微調整に利用し、大規模な最前線モデルと同等の競争力のある性能を実現しています。"
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8BはLlama-3.1-8B-Instructに基づく蒸留大言語モデルで、DeepSeek R1の出力を使用してトレーニングされています。"
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14BはQwen 2.5 14Bに基づく蒸留大言語モデルで、DeepSeek R1の出力を使用してトレーニングされています。このモデルは複数のベンチマークテストでOpenAIのo1-miniを超え、密なモデル（dense models）の最新技術の成果を達成しました。以下は一部のベンチマークテストの結果です：\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nこのモデルはDeepSeek R1の出力から微調整を行い、より大規模な最前線モデルと同等の競争力のある性能を示しています。"
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32BはQwen 2.5 32Bに基づく蒸留大言語モデルで、DeepSeek R1の出力を使用してトレーニングされています。このモデルは複数のベンチマークテストでOpenAIのo1-miniを超え、密なモデル（dense models）の最新技術の成果を達成しました。以下は一部のベンチマークテストの結果です：\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nこのモデルはDeepSeek R1の出力から微調整を行い、より大規模な最前線モデルと同等の競争力のある性能を示しています。"
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1はDeepSeekチームが発表した最新のオープンソースモデルで、特に数学、プログラミング、推論タスクにおいてOpenAIのo1モデルと同等の推論性能を持っています。"
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1は、わずかなラベル付きデータしかない状況で、モデルの推論能力を大幅に向上させました。最終的な回答を出力する前に、モデルは思考の連鎖を出力し、最終的な答えの正確性を向上させます。"
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3は推論速度において前のモデルに比べて大きなブレークスルーを達成しました。オープンソースモデルの中で1位にランクインし、世界の最先端のクローズドモデルと肩を並べることができます。DeepSeek-V3はマルチヘッド潜在注意（MLA）とDeepSeekMoEアーキテクチャを採用しており、これらのアーキテクチャはDeepSeek-V2で完全に検証されています。さらに、DeepSeek-V3は負荷分散のための補助的な非損失戦略を開発し、より強力な性能を得るためにマルチラベル予測トレーニング目標を設定しました。"
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3は推論速度において前のモデルに比べて大きなブレークスルーを達成しました。オープンソースモデルの中で1位にランクインし、世界の最先端のクローズドモデルと肩を並べることができます。DeepSeek-V3はマルチヘッド潜在注意（MLA）とDeepSeekMoEアーキテクチャを採用しており、これらのアーキテクチャはDeepSeek-V2で完全に検証されています。さらに、DeepSeek-V3は負荷分散のための補助的な非損失戦略を開発し、より強力な性能を得るためにマルチラベル予測トレーニング目標を設定しました。"
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-liteは全く新しい世代の軽量版モデルで、極限の応答速度を実現し、効果と遅延の両方で世界トップレベルに達しています。"
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flashは、卓越した速度、ネイティブツールの使用、マルチモーダル生成、1Mトークンのコンテキストウィンドウを含む次世代の機能と改善を提供します。"
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flashモデルのバリアントで、コスト効率と低遅延などの目標に最適化されています。"
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flashモデルのバリアントで、コスト効率と低遅延などの目標に最適化されています。"
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "コスト効率と低遅延を目指して最適化されたGemini 2.0 Flashモデルです。"
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Expは、Googleの最新の実験的なマルチモーダルAIモデルであり、次世代の機能、卓越した速度、ネイティブツールの呼び出し、マルチモーダル生成を備えています。"
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Expは、Googleの最新の実験的なマルチモーダルAIモデルであり、次世代の機能、卓越した速度、ネイティブツールの呼び出し、マルチモーダル生成を備えています。"
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "最新のGPT-4 Turboモデルは視覚機能を備えています。現在、視覚リクエストはJSON形式と関数呼び出しを使用して行うことができます。GPT-4 Turboは、マルチモーダルタスクに対してコスト効率の高いサポートを提供する強化版です。正確性と効率のバランスを取り、リアルタイムのインタラクションが必要なアプリケーションシナリオに適しています。"
  },
+  "gpt-4.5-preview": {
+    "description": "GPT-4.5の研究プレビュー版で、これまでで最大かつ最強のGPTモデルです。広範な世界知識を持ち、ユーザーの意図をよりよく理解することができるため、創造的なタスクや自律的な計画において優れたパフォーマンスを発揮します。GPT-4.5はテキストと画像の入力を受け付け、テキスト出力（構造化出力を含む）を生成します。関数呼び出し、バッチAPI、ストリーミング出力など、重要な開発者機能をサポートしています。創造的でオープンな思考や対話が求められるタスク（執筆、学習、新しいアイデアの探求など）において、GPT-4.5は特に優れた性能を発揮します。知識のカットオフ日は2023年10月です。"
+  },
  "gpt-4o": {
    "description": "ChatGPT-4oは、リアルタイムで更新される動的モデルで、常に最新のバージョンを維持します。強力な言語理解と生成能力を組み合わせており、顧客サービス、教育、技術サポートなどの大規模なアプリケーションシナリオに適しています。"
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8Bは、高効率モデルであり、迅速なテキスト生成能力を提供し、大規模な効率とコスト効果が求められるアプリケーションシナリオに非常に適しています。"
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Llama 3.1 Sonar Huge Onlineモデルは、405Bパラメータを持ち、約127,000トークンのコンテキスト長をサポートし、複雑なオンラインチャットアプリケーション用に設計されています。"
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Llama 3.1 Sonar Large Onlineモデルは、70Bパラメータを持ち、約127,000トークンのコンテキスト長をサポートし、高容量で多様なチャットタスクに適しています。"
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Llama 3.1 Sonar Small Onlineモデルは、8Bパラメータを持ち、約127,000トークンのコンテキスト長をサポートし、オンラインチャット用に設計されており、さまざまなテキストインタラクションを効率的に処理できます。"
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "高解像度画像で優れた画像推論能力を発揮し、視覚理解アプリケーションに適しています。"
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2は、視覚とテキストデータを組み合わせたタスクを処理することを目的としています。画像の説明や視覚的な質問応答などのタスクで優れたパフォーマンスを発揮し、言語生成と視覚推論の間のギャップを超えています。"
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2は、視覚とテキストデータを組み合わせたタスクを処理することを目的としています。画像の説明や視覚的な質問応答などのタスクで優れたパフォーマンスを発揮し、言語生成と視覚推論の間のギャップを超えています。"
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "通義千問の千億レベルの超大規模言語モデルで、中国語、英語などの異なる言語入力をサポートし、現在の通義千問2.5製品バージョンの背後にあるAPIモデルです。"
  },
+  "qwen-omni-turbo-latest": {
+    "description": "Qwen-Omniシリーズモデルは、動画、音声、画像、テキストなどのさまざまなモダリティのデータを入力し、音声とテキストを出力することをサポートしています。"
+  },
  "qwen-plus": {
    "description": "通義千問の超大規模言語モデルの強化版で、中国語、英語などさまざまな言語の入力をサポートしています。"
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Qwen-7B言語モデルを初期化し、画像モデルを追加した、画像入力解像度448の事前トレーニングモデルです。"
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2は全く新しいQwen大規模言語モデルシリーズです。Qwen2 7Bはトランスフォーマーに基づくモデルで、言語理解、多言語能力、プログラミング、数学、推論において優れた性能を示しています。"
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2は全く新しい大型言語モデルシリーズで、より強力な理解と生成能力を備えています。"
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VLはQwen-VLモデルの最新のイテレーションで、MathVista、DocVQA、RealWorldQA、MTVQAなどの視覚理解ベンチマークテストで最先端の性能を達成しました。Qwen2-VLは20分以上のビデオを理解し、高品質なビデオベースの質問応答、対話、コンテンツ作成を行うことができます。また、複雑な推論と意思決定能力を備えており、モバイルデバイスやロボットなどと統合し、視覚環境とテキスト指示に基づいて自動操作を行うことができます。英語と中国語に加えて、Qwen2-VLは現在、ほとんどのヨーロッパ言語、日本語、韓国語、アラビア語、ベトナム語など、異なる言語のテキストを画像内で理解することもサポートしています。"
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instructはアリババクラウドが発表した最新の大言語モデルシリーズの一つです。この72Bモデルはコーディングや数学などの分野で顕著な能力の向上を示しています。このモデルは29以上の言語をカバーする多言語サポートも提供しており、中国語、英語などが含まれています。モデルは指示の追従、構造化データの理解、構造化出力（特にJSON）の生成においても顕著な向上を示しています。"
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instructはアリババクラウドが発表した最新の大言語モデルシリーズの一つです。この32Bモデルはコーディングや数学などの分野で顕著な能力の向上を示しています。このモデルは29以上の言語をカバーする多言語サポートも提供しており、中国語、英語などが含まれています。モデルは指示の追従、構造化データの理解、構造化出力（特にJSON）の生成においても顕著な向上を示しています。"
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "中国語と英語に対応したLLMで、言語、プログラミング、数学、推論などの分野に特化しています。"
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQはAIの推論能力を向上させることに特化した実験的研究モデルです。"
  },
+  "qwq-32b": {
+    "description": "Qwen2.5-32Bモデルに基づいて訓練されたQwQ推論モデルは、強化学習を通じてモデルの推論能力を大幅に向上させました。モデルの数学コードなどのコア指標（AIME 24/25、LiveCodeBench）および一部の一般的な指標（IFEval、LiveBenchなど）は、DeepSeek-R1のフルバージョンに達しており、すべての指標は同じくQwen2.5-32Bに基づくDeepSeek-R1-Distill-Qwen-32Bを大幅に上回っています。"
+  },
  "qwq-32b-preview": {
    "description": "QwQモデルはQwenチームによって開発された実験的な研究モデルで、AIの推論能力を強化することに焦点を当てています。"
  },
+  "qwq-plus-latest": {
+    "description": "Qwen2.5モデルに基づいて訓練されたQwQ推論モデルは、強化学習を通じてモデルの推論能力を大幅に向上させました。モデルの数学コードなどのコア指標（AIME 24/25、LiveCodeBench）および一部の一般的な指標（IFEval、LiveBenchなど）は、DeepSeek-R1のフルバージョンに達しています。"
+  },
+  "r1-1776": {
+    "description": "R1-1776は、DeepSeek R1モデルの一つのバージョンで、後処理を経て、検閲されていない偏りのない事実情報を提供します。"
+  },
  "solar-mini": {
    "description": "Solar MiniはコンパクトなLLMで、GPT-3.5を上回る性能を持ち、強力な多言語能力を備え、英語と韓国語をサポートし、高効率でコンパクトなソリューションを提供します。"
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "検索コンテキストに基づく軽量検索製品で、Sonar Proよりも速く、安価です。"
  },
+  "sonar-deep-research": {
+    "description": "Deep Researchは、専門家による包括的な研究を行い、それをアクセス可能で実行可能なレポートにまとめます。"
+  },
  "sonar-pro": {
    "description": "検索コンテキストをサポートする高度な検索製品で、高度なクエリとフォローアップをサポートします。"
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "効率的で経済的な次世代埋め込みモデル、知識検索やRAGアプリケーションなどのシーンに適しています"
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "智谱AIが発表したGLM-4シリーズの最新世代の事前トレーニングモデルのオープンソース版です。"
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B)は、高効率の戦略とモデルアーキテクチャを通じて、強化された計算能力を提供します。"
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnetは業界標準を向上させ、競合モデルやClaude 3 Opusを超える性能を持ち、広範な評価で優れた結果を示し、我々の中程度のモデルの速度とコストを兼ね備えています。"
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 Sonnetは、Anthropicの最も高速な次世代モデルです。Claude 3 Haikuと比較して、Claude 3.7 Sonnetはすべてのスキルで向上しており、多くの知能ベンチマークテストで前世代の最大モデルClaude 3 Opusを超えています。"
+  },
  "whisper-1": {
    "description": "汎用音声認識モデル、多言語音声認識、音声翻訳、言語認識をサポート"
  },
@@ -140,6 +140,18 @@
      "close": "削除",
      "confirm": "設定が完了し、再試行しました"
    },
+    "crawPages": {
+      "crawling": "リンクを識別中",
+      "detail": {
+        "preview": "プレビュー",
+        "raw": "原文",
+        "tooLong": "テキストが長すぎます。会話のコンテキストには最初の {{characters}} 文字のみが保持され、それを超える部分は会話のコンテキストには含まれません"
+      },
+      "meta": {
+        "crawler": "クローリングモード",
+        "words": "文字数"
+      }
+    },
    "searchxng": {
      "baseURL": "入力してください",
      "description": "SearchXNG の URL を入力すると、ネット検索を開始できます",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexityは、先進的な対話生成モデルの提供者であり、さまざまなLlama 3.1モデルを提供し、オンラインおよびオフラインアプリケーションをサポートし、特に複雑な自然言語処理タスクに適しています。"
  },
+  "ppio": {
+    "description": "PPIO パイオ云は、安定した高コストパフォーマンスのオープンソースモデル API サービスを提供し、DeepSeek の全シリーズ、Llama、Qwen などの業界をリードする大規模モデルをサポートしています。"
+  },
  "qwen": {
    "description": "通義千問は、アリババクラウドが独自に開発した超大規模言語モデルであり、強力な自然言語理解と生成能力を持っています。さまざまな質問に答えたり、文章を創作したり、意見を表現したり、コードを執筆したりすることができ、さまざまな分野で活躍しています。"
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} 복사본",
  "emptyAgent": "도우미가 없습니다",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "단일 대화 생성 비용을 최대 90%까지 줄이고, 응답 속도를 4배 향상시킵니다 (<1>자세히 알아보기</1>). 활성화하면 자동으로 이전 메시지 수 제한이 비활성화됩니다.",
+      "title": "문맥 캐시 활성화"
+    },
    "enableReasoning": {
+      "desc": "Claude Thinking 메커니즘에 기반한 제한 (<1>자세히 알아보기</1>), 활성화하면 자동으로 이전 메시지 수 제한이 비활성화됩니다.",
      "title": "심층 사고 활성화"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "모델 확장 기능"
  },
+  "history": {
+    "title": "도우미는 마지막 {{count}}개의 메시지만 기억합니다."
+  },
  "historyRange": "대화 기록 범위",
  "historySummary": "역사 메시지 요약",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "하위 주제가 존재하여 삭제할 수 없습니다.",
    "regenerate": "다시 생성"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "포인트",
+      "creditPricing": "가격",
+      "creditTooltip": "계산을 용이하게 하기 위해, 1$를 1M 포인트로 환산합니다. 예를 들어, $3/M 토큰은 3포인트/토큰으로 환산됩니다.",
+      "pricing": {
+        "inputCachedTokens": "캐시된 입력 {{amount}}/포인트 · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M 문자",
+        "inputMinutes": "${{amount}}/분",
+        "inputTokens": "입력 {{amount}}/포인트 · ${{amount}}/M",
+        "outputTokens": "출력 {{amount}}/포인트 · ${{amount}}/M",
+        "writeCacheInputTokens": "캐시 입력 쓰기 {{amount}}/포인트 · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "평균 단가",
+      "input": "입력",
+      "inputAudio": "오디오 입력",
+      "inputCached": "입력 캐시",
+      "inputCitation": "입력 인용",
+      "inputText": "텍스트 입력",
+      "inputTitle": "입력 세부사항",
+      "inputUncached": "입력 비캐시",
+      "inputWriteCached": "입력 캐시 쓰기",
+      "output": "출력",
+      "outputAudio": "오디오 출력",
+      "outputText": "텍스트 출력",
+      "outputTitle": "출력 세부사항",
+      "reasoning": "심층 사고",
+      "title": "생성 세부사항",
+      "total": "총 소모"
+    }
+  },
  "newAgent": "새 도우미",
  "pin": "고정",
  "pinOff": "고정 해제",
@@ -322,6 +322,9 @@
    "tooltip": "서비스 제공자 기본 설정 업데이트",
    "updateSuccess": "업데이트 성공"
  },
+  "updateCustomAiProvider": {
+    "title": "사용자 정의 AI 서비스 제공자 구성 업데이트"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "당신의 Vertex AI 키를 입력하세요",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B는 16K 토큰을 지원하며, 효율적이고 매끄러운 언어 생성 능력을 제공합니다."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "제로일 만물, 최신 오픈 소스 미세 조정 모델로, 340억 개의 매개변수를 가지고 있으며, 다양한 대화 시나리오를 지원하는 미세 조정, 고품질 훈련 데이터, 인간의 선호에 맞춘 조정을 제공합니다."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "제로일 만물, 최신 오픈 소스 미세 조정 모델로, 90억 개의 매개변수를 가지고 있으며, 다양한 대화 시나리오를 지원하는 미세 조정, 고품질 훈련 데이터, 인간의 선호에 맞춘 조정을 제공합니다."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro는 360 AI 모델 시리즈의 중요한 구성원으로, 다양한 자연어 응용 시나리오에 맞춘 효율적인 텍스트 처리 능력을 갖추고 있으며, 긴 텍스트 이해 및 다중 회화 기능을 지원합니다."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview는 Qwen 팀이 개발한 시각적 추론 능력에 중점을 둔 연구 모델로, 복잡한 장면 이해 및 시각 관련 수학 문제 해결에서 독특한 장점을 가지고 있습니다."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ는 Qwen 시리즈의 추론 모델입니다. 전통적인 지시 조정 모델과 비교할 때, QwQ는 사고 및 추론 능력을 갖추고 있어 하위 작업에서 특히 어려운 문제를 해결하는 데 있어 성능이 크게 향상됩니다. QwQ-32B는 중형 추론 모델로, 최신 추론 모델(예: DeepSeek-R1, o1-mini)과 비교할 때 경쟁력 있는 성능을 발휘합니다. 이 모델은 RoPE, SwiGLU, RMSNorm 및 Attention QKV bias와 같은 기술을 사용하며, 64층 네트워크 구조와 40개의 Q 주의 헤드(GQA 구조에서 KV는 8개)를 가지고 있습니다."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview는 Qwen의 최신 실험적 연구 모델로, AI 추론 능력을 향상시키는 데 중점을 두고 있습니다. 언어 혼합, 재귀 추론 등 복잡한 메커니즘을 탐구하며, 주요 장점으로는 강력한 추론 분석 능력, 수학 및 프로그래밍 능력이 포함됩니다. 동시에 언어 전환 문제, 추론 루프, 안전성 고려 및 기타 능력 차이와 같은 문제도 존재합니다."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet는 업계 표준을 향상시켰으며, 경쟁 모델과 Claude 3 Opus를 초월하는 성능을 보여주고, 광범위한 평가에서 뛰어난 성과를 보였습니다. 또한 중간 수준 모델의 속도와 비용을 갖추고 있습니다."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet는 업계 표준을 향상시켰으며, 경쟁 모델과 Claude 3 Opus를 초월하는 성능을 보여주고, 광범위한 평가에서 뛰어난 성과를 보였습니다. 또한 중간 수준 모델의 속도와 비용을 갖추고 있습니다."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku는 Anthropic의 가장 빠르고 간결한 모델로, 거의 즉각적인 응답 속도를 제공합니다. 간단한 질문과 요청에 신속하게 답변할 수 있습니다. 고객은 인간 상호작용을 모방하는 원활한 AI 경험을 구축할 수 있습니다. Claude 3 Haiku는 이미지를 처리하고 텍스트 출력을 반환할 수 있으며, 200K의 컨텍스트 창을 갖추고 있습니다."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23은 Cohere에서 출시한 다국어 모델로, 23개 언어를 지원하여 다양한 언어 응용에 편리함을 제공합니다."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B는 백천 인공지능이 개발한 130억 개의 매개변수를 가진 오픈 소스 상용 대형 언어 모델로, 권위 있는 중국어 및 영어 벤치마크에서 동일한 크기에서 최고의 성과를 달성했습니다."
+  },
  "charglm-3": {
    "description": "CharGLM-3는 역할 수행 및 감정 동반을 위해 설계된 모델로, 초장 다회 기억 및 개인화된 대화를 지원하여 광범위하게 사용됩니다."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1은 극히 적은 주석 데이터로 모델의 추론 능력을 크게 향상시킵니다. 최종 답변을 출력하기 전에 모델은 먼저 사고의 연쇄 내용을 출력하여 최종 답변의 정확성을 높입니다."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B는 Llama3.3 70B를 기반으로 한 대형 언어 모델로, DeepSeek R1의 출력을 활용하여 대형 최첨단 모델과 동등한 경쟁 성능을 달성했습니다."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B는 Llama-3.1-8B-Instruct를 기반으로 한 증류 대형 언어 모델로, DeepSeek R1의 출력을 사용하여 훈련되었습니다."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B는 Qwen 2.5 14B를 기반으로 한 증류 대형 언어 모델로, DeepSeek R1의 출력을 사용하여 훈련되었습니다. 이 모델은 여러 벤치마크 테스트에서 OpenAI의 o1-mini를 초월하며, 밀집 모델(dense models)에서 최신 기술 선도 성과(state-of-the-art)를 달성했습니다. 다음은 몇 가지 벤치마크 테스트 결과입니다:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\n이 모델은 DeepSeek R1의 출력을 미세 조정하여 더 큰 규모의 최첨단 모델과 동등한 경쟁 성능을 보여주었습니다."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B는 Qwen 2.5 32B를 기반으로 한 증류 대형 언어 모델로, DeepSeek R1의 출력을 사용하여 훈련되었습니다. 이 모델은 여러 벤치마크 테스트에서 OpenAI의 o1-mini를 초월하며, 밀집 모델(dense models)에서 최신 기술 선도 성과(state-of-the-art)를 달성했습니다. 다음은 몇 가지 벤치마크 테스트 결과입니다:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\n이 모델은 DeepSeek R1의 출력을 미세 조정하여 더 큰 규모의 최첨단 모델과 동등한 경쟁 성능을 보여주었습니다."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1은 DeepSeek 팀이 발표한 최신 오픈 소스 모델로, 특히 수학, 프로그래밍 및 추론 작업에서 OpenAI의 o1 모델과 동등한 수준의 강력한 추론 성능을 갖추고 있습니다."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1은 극히 적은 주석 데이터로 모델의 추론 능력을 크게 향상시킵니다. 최종 답변을 출력하기 전에 모델은 먼저 사고의 연쇄 내용을 출력하여 최종 답변의 정확성을 높입니다."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3는 추론 속도에서 이전 모델에 비해 중대한 돌파구를 이루었습니다. 오픈 소스 모델 중 1위를 차지하며, 세계에서 가장 진보된 폐쇄형 모델과 견줄 수 있습니다. DeepSeek-V3는 다중 헤드 잠재 주의(Multi-Head Latent Attention, MLA)와 DeepSeekMoE 아키텍처를 채택하였으며, 이 아키텍처는 DeepSeek-V2에서 철저히 검증되었습니다. 또한, DeepSeek-V3는 부하 균형을 위한 보조 무손실 전략을 개척하고, 더 강력한 성능을 위해 다중 레이블 예측 훈련 목표를 설정했습니다."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3는 추론 속도에서 이전 모델에 비해 중대한 돌파구를 이루었습니다. 오픈 소스 모델 중 1위를 차지하며, 세계에서 가장 진보된 폐쇄형 모델과 견줄 수 있습니다. DeepSeek-V3는 다중 헤드 잠재 주의(Multi-Head Latent Attention, MLA)와 DeepSeekMoE 아키텍처를 채택하였으며, 이 아키텍처는 DeepSeek-V2에서 철저히 검증되었습니다. 또한, DeepSeek-V3는 부하 균형을 위한 보조 무손실 전략을 개척하고, 더 강력한 성능을 위해 다중 레이블 예측 훈련 목표를 설정했습니다."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite는 전혀 새로운 세대의 경량 모델로, 극한의 응답 속도를 자랑하며, 효과와 지연 모두 세계 최고 수준에 도달했습니다."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash는 뛰어난 속도, 원주율 도구 사용, 다중 모달 생성 및 1M 토큰 문맥 창을 포함한 차세대 기능과 개선 사항을 제공합니다."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 플래시 모델 변형으로, 비용 효율성과 낮은 지연 시간 등의 목표를 위해 최적화되었습니다."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 플래시 모델 변형으로, 비용 효율성과 낮은 지연 시간 등의 목표를 위해 최적화되었습니다."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "비용 효율성과 낮은 지연 시간 등을 목표로 최적화된 Gemini 2.0 Flash 모델입니다."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp는 Google의 최신 실험적 다중 모드 AI 모델로, 차세대 기능, 뛰어난 속도, 네이티브 도구 호출 및 다중 모드 생성을 제공합니다."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp는 Google의 최신 실험적 다중 모드 AI 모델로, 차세대 기능, 뛰어난 속도, 네이티브 도구 호출 및 다중 모드 생성을 제공합니다."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "최신 GPT-4 Turbo 모델은 시각적 기능을 갖추고 있습니다. 이제 시각적 요청은 JSON 형식과 함수 호출을 사용하여 처리할 수 있습니다. GPT-4 Turbo는 다중 모드 작업을 위한 비용 효율적인 지원을 제공하는 향상된 버전입니다. 정확성과 효율성 간의 균형을 찾아 실시간 상호작용이 필요한 응용 프로그램에 적합합니다."
  },
+  "gpt-4.5-preview": {
+    "description": "GPT-4.5 연구 미리보기 버전으로, 지금까지 우리가 만든 가장 크고 강력한 GPT 모델입니다. 광범위한 세계 지식을 보유하고 있으며 사용자 의도를 더 잘 이해하여 창의적인 작업과 자율 계획에서 뛰어난 성능을 발휘합니다. GPT-4.5는 텍스트와 이미지 입력을 수용하고 텍스트 출력을 생성합니다(구조화된 출력 포함). 함수 호출, 배치 API 및 스트리밍 출력을 포함한 주요 개발자 기능을 지원합니다. 창의적이고 개방적인 사고 및 대화가 필요한 작업(예: 글쓰기, 학습 또는 새로운 아이디어 탐색)에서 특히 뛰어난 성능을 보입니다. 지식 기준일은 2023년 10월입니다."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o는 동적 모델로, 최신 버전을 유지하기 위해 실시간으로 업데이트됩니다. 강력한 언어 이해 및 생성 능력을 결합하여 고객 서비스, 교육 및 기술 지원을 포함한 대규모 응용 프로그램에 적합합니다."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B는 효율적인 모델로, 빠른 텍스트 생성 능력을 제공하며, 대규모 효율성과 비용 효과성이 필요한 응용 프로그램에 매우 적합합니다."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Llama 3.1 Sonar Huge Online 모델은 405B 매개변수를 갖추고 있으며, 약 127,000개의 토큰의 컨텍스트 길이를 지원하여 복잡한 온라인 채팅 애플리케이션을 위해 설계되었습니다."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Llama 3.1 Sonar Large Online 모델은 70B 매개변수를 갖추고 있으며, 약 127,000개의 토큰의 컨텍스트 길이를 지원하여 대용량 및 다양한 채팅 작업에 적합합니다."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Llama 3.1 Sonar Small Online 모델은 8B 매개변수를 갖추고 있으며, 약 127,000개의 토큰의 컨텍스트 길이를 지원하여 온라인 채팅을 위해 설계되었습니다."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "고해상도 이미지에서 탁월한 이미지 추론 능력을 발휘하며, 시각 이해 응용 프로그램에 적합합니다."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2는 시각 및 텍스트 데이터를 결합한 작업을 처리하기 위해 설계되었습니다. 이미지 설명 및 시각적 질문 응답과 같은 작업에서 뛰어난 성능을 보이며, 언어 생성과 시각적 추론 간의 간극을 넘습니다."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2는 시각 및 텍스트 데이터를 결합한 작업을 처리하기 위해 설계되었습니다. 이미지 설명 및 시각적 질문 응답과 같은 작업에서 뛰어난 성능을 보이며, 언어 생성과 시각적 추론 간의 간극을 넘습니다."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "통의 천문 1000억급 초대규모 언어 모델로, 중국어, 영어 등 다양한 언어 입력을 지원하며, 현재 통의 천문 2.5 제품 버전의 API 모델입니다."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "Qwen-Omni 시리즈 모델은 비디오, 오디오, 이미지, 텍스트 등 다양한 모드의 데이터를 입력으로 지원하며, 오디오와 텍스트를 출력합니다."
+  },
  "qwen-plus": {
    "description": "통의천문 초대형 언어 모델의 강화 버전으로, 중국어, 영어 등 다양한 언어 입력을 지원합니다."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Qwen-7B 언어 모델로 초기화된 모델로, 이미지 모델을 추가하여 이미지 입력 해상도가 448인 사전 훈련 모델입니다."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2는 새로운 Qwen 대형 언어 모델 시리즈입니다. Qwen2 7B는 트랜스포머 기반 모델로, 언어 이해, 다국어 능력, 프로그래밍, 수학 및 추론에서 뛰어난 성능을 보여줍니다."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2는 더 강력한 이해 및 생성 능력을 갖춘 새로운 대형 언어 모델 시리즈입니다."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL은 Qwen-VL 모델의 최신 반복 버전으로, MathVista, DocVQA, RealWorldQA 및 MTVQA와 같은 시각적 이해 벤치마크 테스트에서 최첨단 성능을 달성했습니다. Qwen2-VL은 20분 이상의 비디오를 이해할 수 있으며, 고품질의 비디오 기반 질문 응답, 대화 및 콘텐츠 생성에 사용됩니다. 또한 복잡한 추론 및 의사 결정 능력을 갖추고 있어, 모바일 장치, 로봇 등과 통합되어 시각적 환경 및 텍스트 지침에 따라 자동으로 작업을 수행할 수 있습니다. 영어와 중국어 외에도 Qwen2-VL은 이제 대부분의 유럽 언어, 일본어, 한국어, 아랍어 및 베트남어 등 다양한 언어의 텍스트를 이해할 수 있습니다."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct는 알리바바 클라우드에서 발표한 최신 대형 언어 모델 시리즈 중 하나입니다. 이 72B 모델은 코딩 및 수학 등 분야에서 현저한 개선된 능력을 가지고 있습니다. 이 모델은 또한 29개 이상의 언어를 포함한 다국어 지원을 제공하며, 지침 준수, 구조화된 데이터 이해 및 구조화된 출력 생성(특히 JSON)에서 현저한 향상을 보였습니다."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct는 알리바바 클라우드에서 발표한 최신 대형 언어 모델 시리즈 중 하나입니다. 이 32B 모델은 코딩 및 수학 등 분야에서 현저한 개선된 능력을 가지고 있습니다. 이 모델은 29개 이상의 언어를 포함한 다국어 지원을 제공하며, 지침 준수, 구조화된 데이터 이해 및 구조화된 출력 생성(특히 JSON)에서 현저한 향상을 보였습니다."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "중국어와 영어를 위한 LLM으로, 언어, 프로그래밍, 수학, 추론 등 다양한 분야를 다룹니다."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ는 AI 추론 능력을 향상시키는 데 중점을 둔 실험 연구 모델입니다."
  },
+  "qwq-32b": {
+    "description": "Qwen2.5-32B 모델을 기반으로 훈련된 QwQ 추론 모델로, 강화 학습을 통해 모델의 추론 능력을 크게 향상시켰습니다. 모델의 수학 코드 등 핵심 지표(AIME 24/25, LiveCodeBench) 및 일부 일반 지표(IFEval, LiveBench 등)는 DeepSeek-R1 풀 버전 수준에 도달했으며, 모든 지표는 동일하게 Qwen2.5-32B를 기반으로 한 DeepSeek-R1-Distill-Qwen-32B를 크게 초과합니다."
+  },
  "qwq-32b-preview": {
    "description": "QwQ 모델은 Qwen 팀이 개발한 실험적 연구 모델로, AI 추론 능력을 향상시키는 데 중점을 두고 있습니다."
  },
+  "qwq-plus-latest": {
+    "description": "Qwen2.5 모델을 기반으로 훈련된 QwQ 추론 모델로, 강화 학습을 통해 모델의 추론 능력을 크게 향상시켰습니다. 모델의 수학 코드 등 핵심 지표(AIME 24/25, LiveCodeBench) 및 일부 일반 지표(IFEval, LiveBench 등)는 DeepSeek-R1 풀 버전 수준에 도달했습니다."
+  },
+  "r1-1776": {
+    "description": "R1-1776은 DeepSeek R1 모델의 한 버전으로, 후속 훈련을 거쳐 검토되지 않은 편향 없는 사실 정보를 제공합니다."
+  },
  "solar-mini": {
    "description": "Solar Mini는 컴팩트한 LLM으로, GPT-3.5보다 성능이 우수하며, 강력한 다국어 능력을 갖추고 있어 영어와 한국어를 지원하며, 효율적이고 소형의 솔루션을 제공합니다."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "검색 맥락 기반의 경량 검색 제품으로, Sonar Pro보다 더 빠르고 저렴합니다."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research는 포괄적인 전문가 수준의 연구를 수행하고 이를 접근 가능하고 실행 가능한 보고서로 통합합니다."
+  },
  "sonar-pro": {
    "description": "고급 쿼리 및 후속 작업을 지원하는 검색 맥락 기반의 고급 검색 제품입니다."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "효율적이고 경제적인 차세대 임베딩 모델로, 지식 검색, RAG 애플리케이션 등 다양한 상황에 적합합니다."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "지프 AI가 발표한 GLM-4 시리즈 최신 세대의 사전 훈련 모델의 오픈 소스 버전입니다."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B)는 효율적인 전략과 모델 아키텍처를 통해 향상된 계산 능력을 제공합니다."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet는 업계 표준을 향상시켰으며, 경쟁 모델과 Claude 3 Opus를 초월하는 성능을 보여주고, 광범위한 평가에서 뛰어난 성과를 보이며, 중간 수준 모델의 속도와 비용을 갖추고 있습니다."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 소네트는 Anthropic의 가장 빠른 차세대 모델입니다. Claude 3 하이쿠와 비교할 때, Claude 3.7 소네트는 모든 기술에서 향상되었으며, 많은 지능 기준 테스트에서 이전 세대의 가장 큰 모델인 Claude 3 오푸스를 초월했습니다."
+  },
  "whisper-1": {
    "description": "범용 음성 인식 모델로, 다국어 음성 인식, 음성 번역 및 언어 인식을 지원합니다."
  },
@@ -140,6 +140,18 @@
      "close": "삭제",
      "confirm": "구성이 완료되었습니다. 다시 시도하십시오."
    },
+    "crawPages": {
+      "crawling": "링크 인식 중",
+      "detail": {
+        "preview": "미리보기",
+        "raw": "원본 텍스트",
+        "tooLong": "텍스트 내용이 너무 깁니다. 대화 맥락은 앞의 {{characters}}자만 유지되며, 초과 부분은 대화 맥락에 포함되지 않습니다."
+      },
+      "meta": {
+        "crawler": "크롤링 모드",
+        "words": "문자 수"
+      }
+    },
    "searchxng": {
      "baseURL": "입력하십시오",
      "description": "SearchXNG의 URL을 입력하면 인터넷 검색을 시작할 수 있습니다.",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity는 선도적인 대화 생성 모델 제공업체로, 다양한 고급 Llama 3.1 모델을 제공하며, 온라인 및 오프라인 응용 프로그램을 지원하고 복잡한 자연어 처리 작업에 특히 적합합니다."
  },
+  "ppio": {
+    "description": "PPIO 파이오 클라우드는 안정적이고 비용 효율적인 오픈 소스 모델 API 서비스를 제공하며, DeepSeek 전 시리즈, Llama, Qwen 등 업계 선도 대모델을 지원합니다."
+  },
  "qwen": {
    "description": "통의천문은 알리바바 클라우드가 자주 개발한 초대형 언어 모델로, 강력한 자연어 이해 및 생성 능력을 갖추고 있습니다. 다양한 질문에 답변하고, 텍스트 콘텐츠를 창작하며, 의견을 표현하고, 코드를 작성하는 등 여러 분야에서 활용됩니다."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} Kopie",
  "emptyAgent": "Geen assistent beschikbaar",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "De kosten voor het genereren van een enkele conversatie kunnen met maximaal 90% worden verlaagd, en de responssnelheid kan tot 4 keer worden verhoogd (<1>Lees meer</1>). Wanneer ingeschakeld, wordt automatisch de limiet voor het aantal historische berichten uitgeschakeld.",
+      "title": "Contextcaching inschakelen"
+    },
    "enableReasoning": {
+      "desc": "Beperkingen op basis van het Claude Thinking-mechanisme (<1>Lees meer</1>), wanneer ingeschakeld, wordt automatisch de limiet voor het aantal historische berichten uitgeschakeld.",
      "title": "Diepe denkwijze inschakelen"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Modeluitbreidingsfunctie"
  },
+  "history": {
+    "title": "De assistent onthoudt alleen de laatste {{count}} berichten"
+  },
  "historyRange": "Geschiedenisbereik",
  "historySummary": "Geschiedenis samenvatting",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Er zijn subonderwerpen, verwijderen is niet mogelijk.",
    "regenerate": "Opnieuw genereren"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Credits",
+      "creditPricing": "Prijsstelling",
+      "creditTooltip": "Voor de eenvoud van de berekening beschouwen we $1 als 1M credits, bijvoorbeeld $3/M tokens wordt omgezet naar 3 credits/token",
+      "pricing": {
+        "inputCachedTokens": "Gecacheerde invoer {{amount}}/credits · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M tekens",
+        "inputMinutes": "${{amount}}/minuut",
+        "inputTokens": "Invoer {{amount}}/credits · ${{amount}}/M",
+        "outputTokens": "Uitvoer {{amount}}/credits · ${{amount}}/M",
+        "writeCacheInputTokens": "Cache-invoer schrijven {{amount}}/punten · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Gemiddelde prijs",
+      "input": "Invoer",
+      "inputAudio": "Audio-invoer",
+      "inputCached": "Gecacheerde invoer",
+      "inputCitation": "Invoer citeren",
+      "inputText": "Tekstinvoer",
+      "inputTitle": "Invoerdetails",
+      "inputUncached": "Ongecacheerde invoer",
+      "inputWriteCached": "Invoer cache schrijven",
+      "output": "Uitvoer",
+      "outputAudio": "Audio-uitvoer",
+      "outputText": "Tekstuitvoer",
+      "outputTitle": "Uitvoerdetails",
+      "reasoning": "Diep nadenken",
+      "title": "Genereren van details",
+      "total": "Totaal verbruik"
+    }
+  },
  "newAgent": "Nieuwe assistent",
  "pin": "Vastzetten",
  "pinOff": "Vastzetten uitschakelen",
@@ -322,6 +322,9 @@
    "tooltip": "Werk basisconfiguratie van provider bij",
    "updateSuccess": "Bijwerking geslaagd"
  },
+  "updateCustomAiProvider": {
+    "title": "Bijwerken van de configuratie van de aangepaste AI-provider"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Vul je Vertex AI-sleutels in",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B ondersteunt 16K tokens en biedt efficiënte, vloeiende taalgeneratiecapaciteiten."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One Everything, het nieuwste open-source fine-tuning model, met 34 miljard parameters, dat fine-tuning ondersteunt voor verschillende dialoogscenario's, met hoogwaardige trainingsdata die zijn afgestemd op menselijke voorkeuren."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One Everything, het nieuwste open-source fine-tuning model, met 9 miljard parameters, dat fine-tuning ondersteunt voor verschillende dialoogscenario's, met hoogwaardige trainingsdata die zijn afgestemd op menselijke voorkeuren."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, als een belangrijk lid van de 360 AI-modelreeks, voldoet aan de diverse natuurlijke taaltoepassingsscenario's met efficiënte tekstverwerkingscapaciteiten en ondersteunt lange tekstbegrip en meerdaagse gesprekken."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview is een onderzoeksmodel ontwikkeld door het Qwen-team, dat zich richt op visuele redeneervaardigheden en unieke voordelen heeft in het begrijpen van complexe scènes en het oplossen van visueel gerelateerde wiskundige problemen."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ is het inferentiemodel van de Qwen-serie. In vergelijking met traditionele instructie-geoptimaliseerde modellen beschikt QwQ over denk- en redeneervaardigheden, waardoor het in staat is om aanzienlijk verbeterde prestaties te leveren in downstream-taken, vooral bij het oplossen van moeilijke problemen. QwQ-32B is een middelgroot inferentiemodel dat concurrerende prestaties kan behalen in vergelijking met de meest geavanceerde inferentiemodellen (zoals DeepSeek-R1, o1-mini). Dit model maakt gebruik van technologieën zoals RoPE, SwiGLU, RMSNorm en Attention QKV bias, en heeft een netwerkstructuur van 64 lagen en 40 Q-aandachtshoofden (met KV van 8 in de GQA-architectuur)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview is het nieuwste experimentele onderzoeksmodel van Qwen, gericht op het verbeteren van AI-redeneringscapaciteiten. Door het verkennen van complexe mechanismen zoals taalmixing en recursieve redenering, zijn de belangrijkste voordelen onder andere krachtige redeneringsanalyses, wiskundige en programmeervaardigheden. Tegelijkertijd zijn er ook problemen met taalwisseling, redeneringscycli, veiligheidskwesties en verschillen in andere capaciteiten."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet heeft de industrienormen verhoogd, met prestaties die de concurrentiemodellen en Claude 3 Opus overtreffen. Het presteert uitstekend in uitgebreide evaluaties, terwijl het de snelheid en kosten van onze middelgrote modellen behoudt."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet is een van de nieuwste modellen van Anthropic, met verbeterde prestaties en een groter contextvenster, waardoor het model beter in staat is om complexe taken uit te voeren."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku is het snelste en meest compacte model van Anthropic, met bijna onmiddellijke reactietijden. Het kan snel eenvoudige vragen en verzoeken beantwoorden. Klanten kunnen een naadloze AI-ervaring creëren die menselijke interactie nabootst. Claude 3 Haiku kan afbeeldingen verwerken en tekstoutput retourneren, met een contextvenster van 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 is een meertalig model van Cohere, ondersteunt 23 talen en biedt gemak voor diverse taaltoepassingen."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B is een open-source, commercieel bruikbaar groot taalmodel ontwikkeld door Baichuan Intelligent, met 13 miljard parameters, dat de beste prestaties in zijn klasse heeft behaald op gezaghebbende Chinese en Engelse benchmarks."
+  },
  "charglm-3": {
    "description": "CharGLM-3 is ontworpen voor rollenspellen en emotionele begeleiding, ondersteunt zeer lange meerdaagse herinneringen en gepersonaliseerde gesprekken, met brede toepassingen."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 heeft de redeneringscapaciteiten van het model aanzienlijk verbeterd, zelfs met zeer weinig gelabelde gegevens. Voordat het model het uiteindelijke antwoord geeft, genereert het eerst een denkproces om de nauwkeurigheid van het uiteindelijke antwoord te verbeteren."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B is een groot taalmodel gebaseerd op Llama3.3 70B, dat gebruikmaakt van de fine-tuning van DeepSeek R1-output en vergelijkbare concurrentieprestaties bereikt als grote vooraanstaande modellen."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B is een gedistilleerd groot taalmodel gebaseerd op Llama-3.1-8B-Instruct, dat is getraind met behulp van de output van DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B is een gedistilleerd groot taalmodel gebaseerd op Qwen 2.5 14B, dat is getraind met behulp van de output van DeepSeek R1. Dit model heeft in verschillende benchmarktests OpenAI's o1-mini overtroffen en heeft de nieuwste technologische vooruitgang behaald voor dichte modellen (state-of-the-art). Hier zijn enkele resultaten van benchmarktests:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nDit model toont concurrentieprestaties die vergelijkbaar zijn met grotere vooraanstaande modellen door fine-tuning op de output van DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B is een gedistilleerd groot taalmodel gebaseerd op Qwen 2.5 32B, dat is getraind met behulp van de output van DeepSeek R1. Dit model heeft in verschillende benchmarktests OpenAI's o1-mini overtroffen en heeft de nieuwste technologische vooruitgang behaald voor dichte modellen (state-of-the-art). Hier zijn enkele resultaten van benchmarktests:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nDit model toont concurrentieprestaties die vergelijkbaar zijn met grotere vooraanstaande modellen door fine-tuning op de output van DeepSeek R1."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 is het nieuwste open-source model dat door het DeepSeek-team is uitgebracht, met zeer krachtige inferentieprestaties, vooral op het gebied van wiskunde, programmeren en redeneringstaken, en bereikt een niveau dat vergelijkbaar is met het o1-model van OpenAI."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 heeft de redeneringscapaciteiten van het model aanzienlijk verbeterd, zelfs met zeer weinig gelabelde gegevens. Voordat het model het uiteindelijke antwoord geeft, genereert het eerst een denkproces om de nauwkeurigheid van het uiteindelijke antwoord te verbeteren."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 heeft een belangrijke doorbraak bereikt in inferentiesnelheid ten opzichte van eerdere modellen. Het staat op de eerste plaats onder open-source modellen en kan zich meten met de meest geavanceerde gesloten modellen ter wereld. DeepSeek-V3 maakt gebruik van Multi-Head Latent Attention (MLA) en de DeepSeekMoE-architectuur, die grondig zijn gevalideerd in DeepSeek-V2. Bovendien introduceert DeepSeek-V3 een aanvullende verliesloze strategie voor load balancing en stelt het multi-label voorspellingsdoelen in om sterkere prestaties te behalen."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 heeft een belangrijke doorbraak bereikt in inferentiesnelheid ten opzichte van eerdere modellen. Het staat op de eerste plaats onder open-source modellen en kan zich meten met de meest geavanceerde gesloten modellen ter wereld. DeepSeek-V3 maakt gebruik van Multi-Head Latent Attention (MLA) en de DeepSeekMoE-architectuur, die grondig zijn gevalideerd in DeepSeek-V2. Bovendien introduceert DeepSeek-V3 een aanvullende verliesloze strategie voor load balancing en stelt het multi-label voorspellingsdoelen in om sterkere prestaties te behalen."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite is de nieuwste generatie lichtgewicht model, met extreme responssnelheid en prestaties die wereldwijd tot de top behoren."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash biedt next-gen functies en verbeteringen, waaronder uitstekende snelheid, native toolgebruik, multimodale generatie en een contextvenster van 1M tokens."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash is een modelvariant die is geoptimaliseerd voor kosteneffectiviteit en lage latentie."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash is een modelvariant die is geoptimaliseerd voor kosteneffectiviteit en lage latentie."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Een Gemini 2.0 Flash-model dat is geoptimaliseerd voor kosteneffectiviteit en lage latentie."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp is Google's nieuwste experimentele multimodale AI-model, met next-gen functies, uitstekende snelheid, native tool-aanroepen en multimodale generatie."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp is Google's nieuwste experimentele multimodale AI-model, met next-gen functies, uitstekende snelheid, native tool-aanroepen en multimodale generatie."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "Het nieuwste GPT-4 Turbo-model heeft visuele functies. Nu kunnen visuele verzoeken worden gedaan met behulp van JSON-indeling en functieaanroepen. GPT-4 Turbo is een verbeterde versie die kosteneffectieve ondersteuning biedt voor multimodale taken. Het vindt een balans tussen nauwkeurigheid en efficiëntie, geschikt voor toepassingen die realtime interactie vereisen."
  },
+  "gpt-4.5-preview": {
+    "description": "De onderzoekspreview van GPT-4.5, ons grootste en krachtigste GPT-model tot nu toe. Het heeft een uitgebreide wereldkennis en kan de intenties van gebruikers beter begrijpen, waardoor het uitblinkt in creatieve taken en autonome planning. GPT-4.5 accepteert tekst- en afbeeldingsinvoer en genereert tekstuitvoer (inclusief gestructureerde uitvoer). Het ondersteunt belangrijke ontwikkelaarsfuncties zoals functieaanroepen, batch-API's en streaminguitvoer. In taken die creativiteit, open denken en dialoog vereisen (zoals schrijven, leren of het verkennen van nieuwe ideeën), presteert GPT-4.5 bijzonder goed. De kennis is bijgewerkt tot oktober 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o is een dynamisch model dat in realtime wordt bijgewerkt om de meest actuele versie te behouden. Het combineert krachtige taalbegrip- en generatiecapaciteiten, geschikt voor grootschalige toepassingsscenario's, waaronder klantenservice, onderwijs en technische ondersteuning."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B is een hoogpresterend model dat snelle tekstgeneratiecapaciteiten biedt, zeer geschikt voor toepassingen die grootschalige efficiëntie en kosteneffectiviteit vereisen."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Llama 3.1 Sonar Huge Online model, met 405B parameters, ondersteunt een contextlengte van ongeveer 127.000 tokens, ontworpen voor complexe online chattoepassingen."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Llama 3.1 Sonar Large Online model, met 70B parameters, ondersteunt een contextlengte van ongeveer 127.000 tokens, geschikt voor hoge capaciteit en diverse chattaken."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Llama 3.1 Sonar Small Online model, met 8B parameters, ondersteunt een contextlengte van ongeveer 127.000 tokens, speciaal ontworpen voor online chat en kan efficiënt verschillende tekstinteracties verwerken."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Uitstekende beeldredeneringscapaciteiten op hoge resolutie-afbeeldingen, geschikt voor visuele begrijptoepassingen."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 is ontworpen voor taken die visuele en tekstuele gegevens combineren. Het presteert uitstekend in taken zoals afbeeldingsbeschrijving en visuele vraag-en-antwoord, en overbrugt de kloof tussen taalgeneratie en visuele redenering."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 is ontworpen voor taken die visuele en tekstuele gegevens combineren. Het presteert uitstekend in taken zoals afbeeldingsbeschrijving en visuele vraag-en-antwoord, en overbrugt de kloof tussen taalgeneratie en visuele redenering."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Het Tongyi Qianwen model met een schaal van honderden miljarden, ondersteunt invoer in verschillende talen, waaronder Chinees en Engels, en is de API-model achter de huidige Tongyi Qianwen 2.5 productversie."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "De Qwen-Omni serie modellen ondersteunt het invoeren van gegevens in verschillende modaliteiten, waaronder video, audio, afbeeldingen en tekst, en kan audio en tekst als output genereren."
+  },
  "qwen-plus": {
    "description": "Qwen is een verbeterde versie van het grootschalige taalmodel dat ondersteuning biedt voor verschillende taalinputs zoals Chinees en Engels."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Geïnitieerd met het Qwen-7B taalmodel, voegt het een afbeeldingsmodel toe, met een invoerresolutie van 448 voor het voorgetrainde model."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 is de gloednieuwe serie van grote taalmodellen van Qwen. Qwen2 7B is een transformer-gebaseerd model dat uitblinkt in taalbegrip, meertalige capaciteiten, programmeren, wiskunde en redenering."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 is een gloednieuwe serie grote taalmodellen met sterkere begrip- en generatiecapaciteiten."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL is de nieuwste iteratie van het Qwen-VL-model en heeft geavanceerde prestaties behaald in visuele begrip benchmarktests, waaronder MathVista, DocVQA, RealWorldQA en MTVQA. Qwen2-VL kan video's van meer dan 20 minuten begrijpen voor hoogwaardige video-gebaseerde vraag-en-antwoord, dialoog en contentcreatie. Het heeft ook complexe redenerings- en besluitvormingscapaciteiten en kan worden geïntegreerd met mobiele apparaten, robots, enzovoort, voor automatische operaties op basis van visuele omgevingen en tekstinstructies. Naast Engels en Chinees ondersteunt Qwen2-VL nu ook het begrijpen van tekst in verschillende talen in afbeeldingen, waaronder de meeste Europese talen, Japans, Koreaans, Arabisch en Vietnamees."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct is een van de nieuwste grote taalmodellen die door Alibaba Cloud is uitgebracht. Dit 72B-model heeft aanzienlijke verbeteringen in codering en wiskunde. Het model biedt ook ondersteuning voor meerdere talen, met meer dan 29 talen, waaronder Chinees en Engels. Het model heeft aanzienlijke verbeteringen in het volgen van instructies, het begrijpen van gestructureerde gegevens en het genereren van gestructureerde output (vooral JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct is een van de nieuwste grote taalmodellen die door Alibaba Cloud is uitgebracht. Dit 32B-model heeft aanzienlijke verbeteringen in codering en wiskunde. Het model biedt ook ondersteuning voor meerdere talen, met meer dan 29 talen, waaronder Chinees en Engels. Het model heeft aanzienlijke verbeteringen in het volgen van instructies, het begrijpen van gestructureerde gegevens en het genereren van gestructureerde output (vooral JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM gericht op zowel Chinees als Engels, gericht op taal, programmeren, wiskunde, redeneren en meer."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ is een experimenteel onderzoeksmodel dat zich richt op het verbeteren van de AI-redeneringscapaciteiten."
  },
+  "qwq-32b": {
+    "description": "De QwQ-inferentiemodel, getraind op het Qwen2.5-32B-model, heeft zijn inferentievermogen aanzienlijk verbeterd door middel van versterkend leren. De kernindicatoren van het model, zoals wiskundige code (AIME 24/25, LiveCodeBench) en enkele algemene indicatoren (IFEval, LiveBench, enz.), bereiken het niveau van de DeepSeek-R1 volwaardige versie, waarbij alle indicatoren aanzienlijk beter presteren dan de DeepSeek-R1-Distill-Qwen-32B, die ook op Qwen2.5-32B is gebaseerd."
+  },
  "qwq-32b-preview": {
    "description": "Het QwQ-model is een experimenteel onderzoeksmodel ontwikkeld door het Qwen-team, gericht op het verbeteren van de AI-redeneringscapaciteiten."
  },
+  "qwq-plus-latest": {
+    "description": "De QwQ-inferentiemodel, getraind op het Qwen2.5-model, heeft zijn inferentievermogen aanzienlijk verbeterd door middel van versterkend leren. De kernindicatoren van het model, zoals wiskundige code (AIME 24/25, LiveCodeBench) en enkele algemene indicatoren (IFEval, LiveBench, enz.), bereiken het niveau van de DeepSeek-R1 volwaardige versie."
+  },
+  "r1-1776": {
+    "description": "R1-1776 is een versie van het DeepSeek R1-model, dat is bijgetraind om ongecensureerde, onpartijdige feitelijke informatie te bieden."
+  },
  "solar-mini": {
    "description": "Solar Mini is een compacte LLM die beter presteert dan GPT-3.5, met sterke meertalige capaciteiten, ondersteunt Engels en Koreaans, en biedt een efficiënte en compacte oplossing."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Een lichtgewicht zoekproduct op basis van contextuele zoekopdrachten, sneller en goedkoper dan Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research voert uitgebreide expertstudies uit en bundelt deze in toegankelijke, bruikbare rapporten."
+  },
  "sonar-pro": {
    "description": "Een geavanceerd zoekproduct dat contextuele zoekopdrachten ondersteunt, met geavanceerde query's en vervolgacties."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Een efficiënte en kosteneffectieve nieuwe generatie Embedding model, geschikt voor kennisretrieval, RAG-toepassingen en andere scenario's."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "De open-source versie van de nieuwste generatie voorgetrainde modellen van de GLM-4-serie, uitgebracht door Zhizhu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) biedt verbeterde rekenkracht door middel van efficiënte strategieën en modelarchitectuur."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet heeft de industrienormen verbeterd, met prestaties die de concurrentiemodellen en Claude 3 Opus overtreffen, en excelleert in uitgebreide evaluaties, terwijl het de snelheid en kosten van onze middelgrote modellen behoudt."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonnet is het snelste volgende generatie model van Anthropic. In vergelijking met Claude 3 Haiku heeft Claude 3.7 Sonnet verbeteringen in verschillende vaardigheden en overtreft het de grootste modellen van de vorige generatie, Claude 3 Opus, in veel intellectuele benchmarktests."
+  },
  "whisper-1": {
    "description": "Algemeen spraakherkenningsmodel, ondersteunt meertalige spraakherkenning, spraakvertaling en taalherkenning."
  },
@@ -140,6 +140,18 @@
      "close": "Verwijderen",
      "confirm": "Configuratie voltooid en opnieuw proberen"
    },
+    "crawPages": {
+      "crawling": "Linkherkenning",
+      "detail": {
+        "preview": "Voorbeeld",
+        "raw": "Oorspronkelijke tekst",
+        "tooLong": "De tekstinhoud is te lang, de gesprekscontext houdt alleen de eerste {{characters}} tekens vast, het overschot wordt niet meegerekend in de gesprekscontext"
+      },
+      "meta": {
+        "crawler": "Crawler-modus",
+        "words": "Aantal tekens"
+      }
+    },
    "searchxng": {
      "baseURL": "Voer in",
      "description": "Voer de URL van SearchXNG in om te beginnen met online zoeken",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity is een toonaangevende aanbieder van dialooggeneratiemodellen, die verschillende geavanceerde Llama 3.1-modellen aanbiedt, die zowel online als offline toepassingen ondersteunen, en bijzonder geschikt zijn voor complexe natuurlijke taalverwerkingstaken."
  },
+  "ppio": {
+    "description": "PPIO biedt stabiele en kosteneffectieve open source model API-diensten, die ondersteuning bieden voor de volledige DeepSeek-serie, Llama, Qwen en andere toonaangevende grote modellen in de industrie."
+  },
  "qwen": {
    "description": "Tongyi Qianwen is een door Alibaba Cloud zelf ontwikkeld grootschalig taalmodel met krachtige mogelijkheden voor natuurlijke taalbegrip en -generatie. Het kan verschillende vragen beantwoorden, tekstinhoud creëren, meningen uiten, code schrijven, en speelt een rol in verschillende domeinen."
  },
@@ -32,7 +32,12 @@
  "duplicateTitle": "{{title}} kopia",
  "emptyAgent": "Brak asystenta",
  "extendParams": {
+    "disableContextCaching": {
+      "desc": "Koszt generowania pojedynczej rozmowy może zostać obniżony o 90%, a prędkość odpowiedzi wzrośnie czterokrotnie (<1>Dowiedz się więcej</1>). Po włączeniu automatycznie wyłączone zostanie ograniczenie liczby wiadomości historycznych",
+      "title": "Włącz pamięć kontekstową"
+    },
    "enableReasoning": {
+      "desc": "Ograniczenia oparte na mechanizmie Claude Thinking (<1>Dowiedz się więcej</1>), po włączeniu automatycznie wyłączone zostanie ograniczenie liczby wiadomości historycznych",
      "title": "Włącz głębokie myślenie"
    },
    "reasoningBudgetToken": {
@@ -40,6 +45,9 @@
    },
    "title": "Funkcje rozszerzenia modelu"
  },
+  "history": {
+    "title": "Asystent zapamięta tylko ostatnie {{count}} wiadomości"
+  },
  "historyRange": "Zakres historii",
  "historySummary": "Podsumowanie wiadomości historycznych",
  "inbox": {
@@ -79,6 +87,39 @@
    "deleteDisabledByThreads": "Istnieją podwątki, nie można usunąć",
    "regenerate": "Wygeneruj ponownie"
  },
+  "messages": {
+    "modelCard": {
+      "credit": "Punkty",
+      "creditPricing": "Cennik",
+      "creditTooltip": "Aby ułatwić obliczenia, przeliczamy 1$ na 1M punktów, na przykład $3/M tokenów to 3 punkty/token",
+      "pricing": {
+        "inputCachedTokens": "Zbuforowane wejście {{amount}}/punktów · ${{amount}}/M",
+        "inputCharts": "${{amount}}/M znaków",
+        "inputMinutes": "${{amount}}/minutę",
+        "inputTokens": "Wejście {{amount}}/punktów · ${{amount}}/M",
+        "outputTokens": "Wyjście {{amount}}/punktów · ${{amount}}/M",
+        "writeCacheInputTokens": "Zapisz wejście w pamięci podręcznej {{amount}}/punktów · ${{amount}}/M"
+      }
+    },
+    "tokenDetails": {
+      "average": "Średnia cena",
+      "input": "Wejście",
+      "inputAudio": "Wejście audio",
+      "inputCached": "Zbuforowane wejście",
+      "inputCitation": "Cytowanie wejścia",
+      "inputText": "Wejście tekstowe",
+      "inputTitle": "Szczegóły wejścia",
+      "inputUncached": "Wejście niezbuforowane",
+      "inputWriteCached": "Zapisz wejście w pamięci podręcznej",
+      "output": "Wyjście",
+      "outputAudio": "Wyjście audio",
+      "outputText": "Wyjście tekstowe",
+      "outputTitle": "Szczegóły wyjścia",
+      "reasoning": "Głębokie myślenie",
+      "title": "Szczegóły generacji",
+      "total": "Całkowite zużycie"
+    }
+  },
  "newAgent": "Nowy asystent",
  "pin": "Przypnij",
  "pinOff": "Odepnij",
@@ -322,6 +322,9 @@
    "tooltip": "Aktualizuj podstawowe ustawienia dostawcy",
    "updateSuccess": "Aktualizacja zakończona sukcesem"
  },
+  "updateCustomAiProvider": {
+    "title": "Aktualizuj konfigurację dostawcy AI"
+  },
  "vertexai": {
    "apiKey": {
      "desc": "Wprowadź swoje klucze Vertex AI",
@@ -8,6 +8,12 @@
  "01-ai/Yi-1.5-9B-Chat-16K": {
    "description": "Yi-1.5 9B obsługuje 16K tokenów, oferując wydajne i płynne zdolności generowania języka."
  },
+  "01-ai/yi-1.5-34b-chat": {
+    "description": "Zero One, najnowszy model open source z dostrojeniem, zawierający 34 miliardy parametrów, dostosowany do różnych scenariuszy dialogowych, z wysokiej jakości danymi treningowymi, dostosowany do preferencji ludzkich."
+  },
+  "01-ai/yi-1.5-9b-chat": {
+    "description": "Zero One, najnowszy model open source z dostrojeniem, zawierający 9 miliardów parametrów, dostosowany do różnych scenariuszy dialogowych, z wysokiej jakości danymi treningowymi, dostosowany do preferencji ludzkich."
+  },
  "360gpt-pro": {
    "description": "360GPT Pro, jako ważny członek serii modeli AI 360, zaspokaja różnorodne potrzeby aplikacji przetwarzania języka naturalnego dzięki wydajnym zdolnościom przetwarzania tekstu, obsługując zrozumienie długich tekstów i wielokrotne dialogi."
  },
@@ -239,6 +245,9 @@
  "Qwen/QVQ-72B-Preview": {
    "description": "QVQ-72B-Preview to model badawczy opracowany przez zespół Qwen, skoncentrowany na zdolnościach wnioskowania wizualnego, który ma unikalne zalety w zrozumieniu złożonych scenariuszy i rozwiązywaniu wizualnie związanych problemów matematycznych."
  },
+  "Qwen/QwQ-32B": {
+    "description": "QwQ jest modelem inferencyjnym z serii Qwen. W porównaniu do tradycyjnych modeli dostosowanych do instrukcji, QwQ posiada zdolności myślenia i wnioskowania, co pozwala na znaczące zwiększenie wydajności w zadaniach końcowych, szczególnie w rozwiązywaniu trudnych problemów. QwQ-32B to średniej wielkości model inferencyjny, który osiąga konkurencyjną wydajność w porównaniu z najnowocześniejszymi modelami inferencyjnymi, takimi jak DeepSeek-R1 i o1-mini. Model ten wykorzystuje technologie takie jak RoPE, SwiGLU, RMSNorm oraz Attention QKV bias, posiada 64-warstwową strukturę sieci i 40 głowic uwagi Q (w architekturze GQA KV wynosi 8)."
+  },
  "Qwen/QwQ-32B-Preview": {
    "description": "QwQ-32B-Preview to najnowszy eksperymentalny model badawczy Qwen, skoncentrowany na zwiększeniu zdolności wnioskowania AI. Poprzez eksplorację złożonych mechanizmów, takich jak mieszanie języków i wnioskowanie rekurencyjne, główne zalety obejmują silne zdolności analizy wnioskowania, matematyki i programowania. Jednocześnie występują problemy z przełączaniem języków, cyklami wnioskowania, kwestiami bezpieczeństwa oraz różnicami w innych zdolnościach."
  },
@@ -467,9 +476,6 @@
  "anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet podnosi standardy branżowe, przewyższając modele konkurencji oraz Claude 3 Opus, wykazując doskonałe wyniki w szerokich ocenach, jednocześnie oferując prędkość i koszty naszych modeli średniego poziomu."
  },
-  "anthropic.claude-3-7-sonnet-20250219-v1:0": {
-    "description": "Claude 3.7 Sonnet to najnowszy model od Anthropic, który oferuje doskonałe wyniki w szerokim zakresie zadań, w tym generowanie treści, rozumienie języka naturalnego i przestrzeganie instrukcji. Claude 3.7 Sonnet jest szybki, niezawodny i ekonomiczny, co sprawia, że jest idealny do zastosowań produkcyjnych."
-  },
  "anthropic.claude-3-haiku-20240307-v1:0": {
    "description": "Claude 3 Haiku to najszybszy i najbardziej kompaktowy model od Anthropic, oferujący niemal natychmiastową szybkość odpowiedzi. Może szybko odpowiadać na proste zapytania i prośby. Klienci będą mogli budować płynne doświadczenia AI, które naśladują interakcje międzyludzkie. Claude 3 Haiku może przetwarzać obrazy i zwracać wyjścia tekstowe, z oknem kontekstowym wynoszącym 200K."
  },
@@ -506,6 +512,9 @@
  "aya:35b": {
    "description": "Aya 23 to model wielojęzyczny wydany przez Cohere, wspierający 23 języki, ułatwiający różnorodne zastosowania językowe."
  },
+  "baichuan/baichuan2-13b-chat": {
+    "description": "Baichuan-13B to otwarty model językowy stworzony przez Baichuan Intelligence, zawierający 13 miliardów parametrów, który osiągnął najlepsze wyniki w swojej klasie w autorytatywnych benchmarkach w języku chińskim i angielskim."
+  },
  "charglm-3": {
    "description": "CharGLM-3 zaprojektowany z myślą o odgrywaniu ról i emocjonalnym towarzyszeniu, obsługujący ultra-długą pamięć wielokrotną i spersonalizowane dialogi, z szerokim zakresem zastosowań."
  },
@@ -686,9 +695,30 @@
  "deepseek/deepseek-r1": {
    "description": "DeepSeek-R1 znacznie poprawił zdolności wnioskowania modelu przy minimalnej ilości oznaczonych danych. Przed wygenerowaniem ostatecznej odpowiedzi, model najpierw wygeneruje fragment myślenia, aby zwiększyć dokładność końcowej odpowiedzi."
  },
+  "deepseek/deepseek-r1-distill-llama-70b": {
+    "description": "DeepSeek R1 Distill Llama 70B to duży model językowy oparty na Llama3.3 70B, który wykorzystuje dostrojenie na podstawie wyjścia DeepSeek R1, osiągając konkurencyjną wydajność porównywalną z dużymi modelami na czołowej pozycji."
+  },
+  "deepseek/deepseek-r1-distill-llama-8b": {
+    "description": "DeepSeek R1 Distill Llama 8B to destylowany duży model językowy oparty na Llama-3.1-8B-Instruct, wytrenowany przy użyciu wyjścia DeepSeek R1."
+  },
+  "deepseek/deepseek-r1-distill-qwen-14b": {
+    "description": "DeepSeek R1 Distill Qwen 14B to destylowany duży model językowy oparty na Qwen 2.5 14B, wytrenowany przy użyciu wyjścia DeepSeek R1. Model ten przewyższył OpenAI o1-mini w wielu testach benchmarkowych, osiągając najnowsze osiągnięcia technologiczne w dziedzinie modeli gęstych (dense models). Oto niektóre wyniki testów benchmarkowych:\nAIME 2024 pass@1: 69.7\nMATH-500 pass@1: 93.9\nCodeForces Rating: 1481\nModel ten, dostrojony na podstawie wyjścia DeepSeek R1, wykazuje konkurencyjną wydajność porównywalną z większymi modelami na czołowej pozycji."
+  },
+  "deepseek/deepseek-r1-distill-qwen-32b": {
+    "description": "DeepSeek R1 Distill Qwen 32B to destylowany duży model językowy oparty na Qwen 2.5 32B, wytrenowany przy użyciu wyjścia DeepSeek R1. Model ten przewyższył OpenAI o1-mini w wielu testach benchmarkowych, osiągając najnowsze osiągnięcia technologiczne w dziedzinie modeli gęstych (dense models). Oto niektóre wyniki testów benchmarkowych:\nAIME 2024 pass@1: 72.6\nMATH-500 pass@1: 94.3\nCodeForces Rating: 1691\nModel ten, dostrojony na podstawie wyjścia DeepSeek R1, wykazuje konkurencyjną wydajność porównywalną z większymi modelami na czołowej pozycji."
+  },
+  "deepseek/deepseek-r1/community": {
+    "description": "DeepSeek R1 to najnowszy model open source wydany przez zespół DeepSeek, który charakteryzuje się bardzo silnymi możliwościami wnioskowania, szczególnie w zadaniach matematycznych, programistycznych i logicznych, osiągając poziom porównywalny z modelem o1 OpenAI."
+  },
  "deepseek/deepseek-r1:free": {
    "description": "DeepSeek-R1 znacznie poprawił zdolności wnioskowania modelu przy minimalnej ilości oznaczonych danych. Przed wygenerowaniem ostatecznej odpowiedzi, model najpierw wygeneruje fragment myślenia, aby zwiększyć dokładność końcowej odpowiedzi."
  },
+  "deepseek/deepseek-v3": {
+    "description": "DeepSeek-V3 osiągnął znaczący przełom w szybkości wnioskowania w porównaniu do wcześniejszych modeli. Zajmuje pierwsze miejsce wśród modeli open source i może konkurować z najnowocześniejszymi modelami zamkniętymi na świecie. DeepSeek-V3 wykorzystuje architekturę wielogłowicowej uwagi (MLA) oraz DeepSeekMoE, które zostały w pełni zweryfikowane w DeepSeek-V2. Ponadto, DeepSeek-V3 wprowadza pomocniczą strategię bezstratną do równoważenia obciążenia oraz ustala cele treningowe dla wieloetykietowego przewidywania, aby uzyskać lepszą wydajność."
+  },
+  "deepseek/deepseek-v3/community": {
+    "description": "DeepSeek-V3 osiągnął znaczący przełom w szybkości wnioskowania w porównaniu do wcześniejszych modeli. Zajmuje pierwsze miejsce wśród modeli open source i może konkurować z najnowocześniejszymi modelami zamkniętymi na świecie. DeepSeek-V3 wykorzystuje architekturę wielogłowicowej uwagi (MLA) oraz DeepSeekMoE, które zostały w pełni zweryfikowane w DeepSeek-V2. Ponadto, DeepSeek-V3 wprowadza pomocniczą strategię bezstratną do równoważenia obciążenia oraz ustala cele treningowe dla wieloetykietowego przewidywania, aby uzyskać lepszą wydajność."
+  },
  "doubao-1.5-lite-32k": {
    "description": "Doubao-1.5-lite to nowa generacja modelu o lekkiej konstrukcji, charakteryzująca się ekstremalną szybkością reakcji, osiągając światowy poziom zarówno w zakresie wydajności, jak i opóźnienia."
  },
@@ -800,9 +830,18 @@
  "gemini-2.0-flash-001": {
    "description": "Gemini 2.0 Flash oferuje funkcje i ulepszenia nowej generacji, w tym doskonałą prędkość, natywne korzystanie z narzędzi, generowanie multimodalne oraz okno kontekstowe o długości 1M tokenów."
  },
+  "gemini-2.0-flash-lite": {
+    "description": "Gemini 2.0 Flash to wariant modelu, zoptymalizowany pod kątem efektywności kosztowej i niskiego opóźnienia."
+  },
+  "gemini-2.0-flash-lite-001": {
+    "description": "Gemini 2.0 Flash to wariant modelu, zoptymalizowany pod kątem efektywności kosztowej i niskiego opóźnienia."
+  },
  "gemini-2.0-flash-lite-preview-02-05": {
    "description": "Model Gemini 2.0 Flash, zoptymalizowany pod kątem efektywności kosztowej i niskiej latencji."
  },
+  "gemini-2.0-flash-thinking-exp": {
+    "description": "Gemini 2.0 Flash Exp to najnowszy eksperymentalny model AI multimodalnego Google, posiadający cechy nowej generacji, doskonałą prędkość, natywne wywołania narzędzi oraz generację multimodalną."
+  },
  "gemini-2.0-flash-thinking-exp-01-21": {
    "description": "Gemini 2.0 Flash Exp to najnowszy eksperymentalny model AI multimodalnego Google, posiadający cechy nowej generacji, doskonałą prędkość, natywne wywołania narzędzi oraz generację multimodalną."
  },
@@ -953,6 +992,9 @@
  "gpt-4-vision-preview": {
    "description": "Najnowszy model GPT-4 Turbo posiada funkcje wizualne. Teraz zapytania wizualne mogą być obsługiwane za pomocą formatu JSON i wywołań funkcji. GPT-4 Turbo to ulepszona wersja, która oferuje opłacalne wsparcie dla zadań multimodalnych. Znajduje równowagę między dokładnością a wydajnością, co czyni go odpowiednim do aplikacji wymagających interakcji w czasie rzeczywistym."
  },
+  "gpt-4.5-preview": {
+    "description": "Wersja badawcza GPT-4.5, która jest naszym największym i najpotężniejszym modelem GPT do tej pory. Posiada szeroką wiedzę o świecie i lepiej rozumie intencje użytkowników, co sprawia, że doskonale radzi sobie w zadaniach kreatywnych i autonomicznym planowaniu. GPT-4.5 akceptuje tekstowe i graficzne wejścia oraz generuje wyjścia tekstowe (w tym wyjścia strukturalne). Wspiera kluczowe funkcje dla deweloperów, takie jak wywołania funkcji, API wsadowe i strumieniowe wyjścia. W zadaniach wymagających kreatywności, otwartego myślenia i dialogu (takich jak pisanie, nauka czy odkrywanie nowych pomysłów), GPT-4.5 sprawdza się szczególnie dobrze. Data graniczna wiedzy to październik 2023."
+  },
  "gpt-4o": {
    "description": "ChatGPT-4o to dynamiczny model, który jest na bieżąco aktualizowany, aby utrzymać najnowszą wersję. Łączy potężne zdolności rozumienia i generowania języka, co czyni go odpowiednim do zastosowań na dużą skalę, w tym obsługi klienta, edukacji i wsparcia technicznego."
  },
@@ -1088,15 +1130,6 @@
  "llama-3.1-8b-instant": {
    "description": "Llama 3.1 8B to model o wysokiej wydajności, oferujący szybkie możliwości generowania tekstu, idealny do zastosowań wymagających dużej efektywności i opłacalności."
  },
-  "llama-3.1-sonar-huge-128k-online": {
-    "description": "Model Llama 3.1 Sonar Huge Online, z 405B parametrami, obsługujący kontekst o długości około 127,000 tokenów, zaprojektowany do złożonych aplikacji czatu online."
-  },
-  "llama-3.1-sonar-large-128k-online": {
-    "description": "Model Llama 3.1 Sonar Large Online, z 70B parametrami, obsługujący kontekst o długości około 127,000 tokenów, idealny do zadań czatu o dużej pojemności i różnorodności."
-  },
-  "llama-3.1-sonar-small-128k-online": {
-    "description": "Model Llama 3.1 Sonar Small Online, z 8B parametrami, obsługujący kontekst o długości około 127,000 tokenów, zaprojektowany do czatów online, efektywnie przetwarzający różne interakcje tekstowe."
-  },
  "llama-3.2-11b-vision-instruct": {
    "description": "Wyjątkowe zdolności wnioskowania wizualnego na obrazach o wysokiej rozdzielczości, idealne do zastosowań związanych ze zrozumieniem wizualnym."
  },
@@ -1250,6 +1283,9 @@
  "meta-llama/llama-3.2-11b-vision-instruct": {
    "description": "LLaMA 3.2 jest zaprojektowana do przetwarzania zadań łączących dane wizualne i tekstowe. Wykazuje doskonałe wyniki w zadaniach takich jak opisywanie obrazów i wizualne pytania i odpowiedzi, przekraczając granice między generowaniem języka a wnioskowaniem wizualnym."
  },
+  "meta-llama/llama-3.2-3b-instruct": {
+    "description": "meta-llama/llama-3.2-3b-instruct"
+  },
  "meta-llama/llama-3.2-90b-vision-instruct": {
    "description": "LLaMA 3.2 jest zaprojektowana do przetwarzania zadań łączących dane wizualne i tekstowe. Wykazuje doskonałe wyniki w zadaniach takich jak opisywanie obrazów i wizualne pytania i odpowiedzi, przekraczając granice między generowaniem języka a wnioskowaniem wizualnym."
  },
@@ -1484,6 +1520,9 @@
  "qwen-max-latest": {
    "description": "Model językowy Qwen Max o skali miliardów parametrów, obsługujący różne języki, w tym chiński i angielski, będący API modelu za produktem Qwen 2.5."
  },
+  "qwen-omni-turbo-latest": {
+    "description": "Modele z serii Qwen-Omni obsługują różne rodzaje danych wejściowych, w tym wideo, audio, obrazy i tekst, oraz generują wyjścia w postaci audio i tekstu."
+  },
  "qwen-plus": {
    "description": "Qwen Plus to ulepszona wersja ogromnego modelu językowego, wspierająca różne języki, w tym chiński i angielski."
  },
@@ -1511,9 +1550,21 @@
  "qwen-vl-v1": {
    "description": "Model wstępnie wytrenowany, zainicjowany przez model językowy Qwen-7B, dodający model obrazowy, z rozdzielczością wejściową obrazu wynoszącą 448."
  },
+  "qwen/qwen-2-7b-instruct": {
+    "description": "Qwen2 to nowa seria dużych modeli językowych Qwen. Qwen2 7B to model oparty na transformatorze, który wykazuje doskonałe wyniki w zakresie rozumienia języka, zdolności wielojęzycznych, programowania, matematyki i wnioskowania."
+  },
  "qwen/qwen-2-7b-instruct:free": {
    "description": "Qwen2 to nowa seria dużych modeli językowych, charakteryzująca się silniejszymi zdolnościami rozumienia i generowania."
  },
+  "qwen/qwen-2-vl-72b-instruct": {
+    "description": "Qwen2-VL to najnowsza iteracja modelu Qwen-VL, która osiągnęła najnowocześniejsze wyniki w testach benchmarkowych dotyczących rozumienia wizualnego, w tym MathVista, DocVQA, RealWorldQA i MTVQA. Qwen2-VL potrafi rozumieć filmy trwające ponad 20 minut, umożliwiając wysokiej jakości pytania i odpowiedzi, dialogi oraz tworzenie treści oparte na wideo. Posiada również zdolności do złożonego wnioskowania i podejmowania decyzji, co pozwala na integrację z urządzeniami mobilnymi, robotami itp., aby automatycznie działać na podstawie środowiska wizualnego i instrukcji tekstowych. Oprócz angielskiego i chińskiego, Qwen2-VL teraz wspiera również rozumienie tekstu w różnych językach w obrazach, w tym większości języków europejskich, japońskiego, koreańskiego, arabskiego i wietnamskiego."
+  },
+  "qwen/qwen-2.5-72b-instruct": {
+    "description": "Qwen2.5-72B-Instruct to jeden z najnowszych modeli dużych języków wydanych przez Alibaba Cloud. Model 72B wykazuje znaczną poprawę w obszarach kodowania i matematyki. Model ten oferuje wsparcie dla wielu języków, obejmując ponad 29 języków, w tym chiński i angielski. Model znacząco poprawił zdolność do podążania za instrukcjami, rozumienia danych strukturalnych oraz generowania strukturalnych wyników (szczególnie JSON)."
+  },
+  "qwen/qwen2.5-32b-instruct": {
+    "description": "Qwen2.5-32B-Instruct to jeden z najnowszych modeli dużych języków wydanych przez Alibaba Cloud. Model 32B wykazuje znaczną poprawę w obszarach kodowania i matematyki. Model ten oferuje wsparcie dla wielu języków, obejmując ponad 29 języków, w tym chiński i angielski. Model znacząco poprawił zdolność do podążania za instrukcjami, rozumienia danych strukturalnych oraz generowania strukturalnych wyników (szczególnie JSON)."
+  },
  "qwen/qwen2.5-7b-instruct": {
    "description": "LLM skierowany na język chiński i angielski, skoncentrowany na języku, programowaniu, matematyce, wnioskowaniu i innych dziedzinach."
  },
@@ -1589,9 +1640,18 @@
  "qwq": {
    "description": "QwQ to eksperymentalny model badawczy, skoncentrowany na zwiększeniu zdolności wnioskowania AI."
  },
+  "qwq-32b": {
+    "description": "Model inferency QwQ, oparty na modelu Qwen2.5-32B, został znacznie ulepszony dzięki uczeniu przez wzmocnienie, co zwiększa jego zdolności inferencyjne. Kluczowe wskaźniki modelu, takie jak matematyczny kod i inne (AIME 24/25, LiveCodeBench), oraz niektóre ogólne wskaźniki (IFEval, LiveBench itp.) osiągają poziom pełnej wersji DeepSeek-R1, a wszystkie wskaźniki znacznie przewyższają te, które są oparte na Qwen2.5-32B, w tym DeepSeek-R1-Distill-Qwen-32B."
+  },
  "qwq-32b-preview": {
    "description": "Model QwQ to eksperymentalny model badawczy opracowany przez zespół Qwen, skoncentrowany na zwiększeniu zdolności wnioskowania AI."
  },
+  "qwq-plus-latest": {
+    "description": "Model inferency QwQ, oparty na modelu Qwen2.5, został znacznie ulepszony dzięki uczeniu przez wzmocnienie, co zwiększa jego zdolności inferencyjne. Kluczowe wskaźniki modelu, takie jak matematyczny kod i inne (AIME 24/25, LiveCodeBench), oraz niektóre ogólne wskaźniki (IFEval, LiveBench itp.) osiągają poziom pełnej wersji DeepSeek-R1."
+  },
+  "r1-1776": {
+    "description": "R1-1776 to wersja modelu DeepSeek R1, która została poddana dalszemu treningowi, aby dostarczać nieocenzurowane, bezstronne informacje faktograficzne."
+  },
  "solar-mini": {
    "description": "Solar Mini to kompaktowy LLM, który przewyższa GPT-3.5, posiadając potężne zdolności wielojęzyczne, wspierając angielski i koreański, oferując efektywne i zgrabne rozwiązania."
  },
@@ -1604,6 +1664,9 @@
  "sonar": {
    "description": "Lekki produkt wyszukiwania oparty na kontekście, szybszy i tańszy niż Sonar Pro."
  },
+  "sonar-deep-research": {
+    "description": "Deep Research przeprowadza kompleksowe badania na poziomie eksperckim i łączy je w dostępne, praktyczne raporty."
+  },
  "sonar-pro": {
    "description": "Zaawansowany produkt wyszukiwania wspierający kontekst wyszukiwania, oferujący zaawansowane zapytania i śledzenie."
  },
@@ -1661,6 +1724,9 @@
  "text-embedding-3-small": {
    "description": "Nowej generacji model Embedding, efektywny i ekonomiczny, odpowiedni do wyszukiwania wiedzy, aplikacji RAG i innych scenariuszy."
  },
+  "thudm/glm-4-9b-chat": {
+    "description": "Otwarta wersja najnowszej generacji modelu pretrenowanego GLM-4 wydanego przez Zhipu AI."
+  },
  "togethercomputer/StripedHyena-Nous-7B": {
    "description": "StripedHyena Nous (7B) oferuje zwiększoną moc obliczeniową dzięki efektywnym strategiom i architekturze modelu."
  },
@@ -1676,6 +1742,9 @@
  "us.anthropic.claude-3-5-sonnet-20241022-v2:0": {
    "description": "Claude 3.5 Sonnet podnosi standardy branżowe, przewyższając modele konkurencji oraz Claude 3 Opus, osiągając doskonałe wyniki w szerokim zakresie ocen, przy zachowaniu prędkości i kosztów naszych modeli średniego poziomu."
  },
+  "us.anthropic.claude-3-7-sonnet-20250219-v1:0": {
+    "description": "Claude 3.7 sonet to najszybszy model następnej generacji od Anthropic. W porównaniu do Claude 3 Haiku, Claude 3.7 Sonet wykazuje poprawę w różnych umiejętnościach i przewyższa największy model poprzedniej generacji, Claude 3 Opus, w wielu testach inteligencji."
+  },
  "whisper-1": {
    "description": "Uniwersalny model rozpoznawania mowy, obsługujący rozpoznawanie mowy w wielu językach, tłumaczenie mowy i rozpoznawanie języków."
  },
@@ -140,6 +140,18 @@
      "close": "Usuń",
      "confirm": "Konfiguracja zakończona, spróbuj ponownie"
    },
+    "crawPages": {
+      "crawling": "Rozpoznawanie linków",
+      "detail": {
+        "preview": "Podgląd",
+        "raw": "Tekst źródłowy",
+        "tooLong": "Treść tekstu jest zbyt długa, kontekst rozmowy zachowuje tylko pierwsze {{characters}} znaków, a nadmiar nie jest uwzględniany w kontekście rozmowy"
+      },
+      "meta": {
+        "crawler": "Tryb przeszukiwania",
+        "words": "Liczba znaków"
+      }
+    },
    "searchxng": {
      "baseURL": "Wprowadź",
      "description": "Wprowadź adres URL SearchXNG, aby rozpocząć wyszukiwanie w sieci",
@@ -89,6 +89,9 @@
  "perplexity": {
    "description": "Perplexity to wiodący dostawca modeli generacji dialogów, oferujący różnorodne zaawansowane modele Llama 3.1, wspierające aplikacje online i offline, szczególnie odpowiednie do złożonych zadań przetwarzania języka naturalnego."
  },
+  "ppio": {
+    "description": "PPIO Paiou Cloud oferuje stabilne i opłacalne usługi API modeli open source, wspierające pełną gamę DeepSeek, Llama, Qwen i inne wiodące modele w branży."
+  },
  "qwen": {
    "description": "Tongyi Qianwen to samodzielnie opracowany przez Alibaba Cloud model językowy o dużej skali, charakteryzujący się silnymi zdolnościami rozumienia i generowania języka naturalnego. Może odpowiadać na różnorodne pytania, tworzyć treści pisemne, wyrażać opinie, pisać kod i działać w wielu dziedzinach."
  },
--- a/Show More
+++ b/Show More