diff --git a/.github/ISSUE_TEMPLATE/bug_report.yml b/.github/ISSUE_TEMPLATE/bug_report.yml
index c8806d68..ca963b82 100644
--- a/.github/ISSUE_TEMPLATE/bug_report.yml
+++ b/.github/ISSUE_TEMPLATE/bug_report.yml
@@ -56,7 +56,7 @@ body:
label: Environment
description: Share your environment details. Reports without proper environment details will likely be closed.
value: |
- - APINTO Dashboard version:
+ - ApiPark version:
- Operating system (run `uname -a`):
validations:
required: true
\ No newline at end of file
diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml
deleted file mode 100644
index 035b15b9..00000000
--- a/.gitlab-ci.yml
+++ /dev/null
@@ -1,99 +0,0 @@
-variables:
- PATH: /opt/go-1.23/go/bin/:/opt/node-1.22/bin/:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/root/bin
- GOROOT: /opt/go-1.23/go
- GOPROXY: https://goproxy.cn
- VERSION: $CI_COMMIT_SHORT_SHA
- APP: apipark
- APP_PRE: ${APP}_${VERSION}
- BUILD_DIR: ${APP}-build
- DEPLOY_DESC: "DEV 环境"
- VIEW_ADDR: http://172.18.166.219:8288
- SAVE_DIR: /opt/${APP}
- NODE_OPTIONS: --max_old_space_size=8192
- APIPARK_OLLAMA_BASE: http://127.0.0.1:11434
-
-stages:
- - notice
- - prefix
- - build
- - deploy
- - webhook
-
-feishu-informer: # 飞书回调
- stage: notice
- variables:
- DIFF_URL: "$CI_MERGE_REQUEST_PROJECT_URL/-/merge_requests/$CI_MERGE_REQUEST_IID/diffs"
- rules:
- - if: $CI_PIPELINE_SOURCE=="merge_request_event" && $CI_COMMIT_BRANCH =~ "main"
- script:
- - echo "merge request"
- - |
- curl -X POST -H "Content-Type: application/json" \
- -d "{\"msg_type\":\"text\",\"content\":{\"text\":\"项目:${CI_PROJECT_NAME}\\n提交人:${GITLAB_USER_NAME}\\n提交信息:${CI_MERGE_REQUEST_TITLE}\\n合并分支信息:${CI_MERGE_REQUEST_SOURCE_BRANCH_NAME} -> ${CI_MERGE_REQUEST_TARGET_BRANCH_NAME}\\n差异性地址:${DIFF_URL}\\n请及时review代码\"}}" \
- https://open.feishu.cn/open-apis/bot/v2/hook/1c334752-2874-41a1-8f1b-3060f2d46b6c
-
-prebuild:
- stage: prefix
- rules:
- - if: $CI_COMMIT_BRANCH == "main"
- script:
- - echo "prebuild"
- - chmod +x ./scripts/prefix.sh
- - ./scripts/prefix.sh
-
-builder:
- stage: build
- rules:
- - if: $CI_COMMIT_BRANCH == "main"
- script:
- - set -e
- - |
- if [ ! -d "../artifacts" ]; then
- mkdir -p ../artifacts
- fi
- if [ -d "../artifacts/dist" ]; then
- cp -r ../artifacts/dist frontend/dist
- fi
- - |
- if [ -n "$(git diff --name-status HEAD~1 HEAD -- frontend)" ]; then
- ./scripts/build.sh $BUILD_DIR ${VERSION} all ""
- else
- ./scripts/build.sh $BUILD_DIR ${VERSION}
- fi
- if [ -d "frontend/dist" ]; then
- echo "copy frontend/dist to artifacts/dist"
- rm -fr ../artifacts/dist
- cp -r frontend/dist ../artifacts/dist
- fi
- cp $BUILD_DIR/${APP_PRE}_linux_amd64.tar.gz ${SAVE_DIR}
-
-deployer:
- stage: deploy
- rules:
- - if: $CI_COMMIT_BRANCH == "main"
- variables:
- APIPARK_GUEST_MODE: allow
- APIPARK_GUEST_ID: dklejrfbhjqwdh
- script:
- - cd ${SAVE_DIR};mkdir -p ${APP_PRE};tar -zxvf ${APP_PRE}_linux_amd64.tar.gz -C ${APP_PRE};cd ${APP_PRE};./install.sh ${SAVE_DIR};./run.sh restart;cd ${SAVE_DIR} && ./clean.sh ${APP_PRE}
- when: on_success
-success:
- stage: webhook
- rules:
- - if: $CI_COMMIT_BRANCH == "main"
- script:
- - |
- curl -X POST -H "Content-Type: application/json" \
- -d "{\"msg_type\":\"text\",\"content\":{\"text\":\"最近一次提交:${CI_COMMIT_TITLE}\\n提交人:${GITLAB_USER_NAME}\\n项目:${CI_PROJECT_NAME}\\n环境:${DEPLOY_DESC}\\n更新部署完成.\\n访问地址:${VIEW_ADDR}\\n工作流地址:${CI_PIPELINE_URL}\"}}" \
- https://open.feishu.cn/open-apis/bot/v2/hook/c3672932-4dfa-4989-8023-0128bae59338
- when: on_success
-failure:
- stage: webhook
- rules:
- - if: $CI_COMMIT_BRANCH == "main"
- script:
- - |
- curl -X POST -H "Content-Type: application/json" \
- -d "{\"msg_type\":\"text\",\"content\":{\"text\":\"最近一次提交:${CI_COMMIT_TITLE}\\n提交人:${GITLAB_USER_NAME}\\n项目:${CI_PROJECT_NAME}\\n环境:${DEPLOY_DESC}\\n更新部署失败,请及时到gitlab上查看\\n工作流地址:${CI_PIPELINE_URL}\"}}" \
- https://open.feishu.cn/open-apis/bot/v2/hook/c3672932-4dfa-4989-8023-0128bae59338
- when: on_failure
diff --git a/ai-provider/local/local.go b/ai-provider/local/local.go
index 5e084eeb..bcea9e84 100644
--- a/ai-provider/local/local.go
+++ b/ai-provider/local/local.go
@@ -8,10 +8,11 @@ import (
)
var (
- client *api.Client
+ client *api.Client
+ ProviderLocal = "LocalModel"
)
-func ResetOllamaAddress(address string) error {
+func ResetLocalAddress(address string) error {
u, err := url.Parse(address)
if err != nil {
return err
@@ -19,3 +20,12 @@ func ResetOllamaAddress(address string) error {
client = api.NewClient(u, http.DefaultClient)
return nil
}
+
+var (
+ LocalConfig = "{\n \"temperature\": \"\",\n \"top_p\": \"\",\n \"max_tokens\": \"\"\n}"
+ LocalSvg = `
+
+`
+)
diff --git a/ai-provider/local/models.json b/ai-provider/local/models.json
index 74fea8d1..42bc9927 100644
--- a/ai-provider/local/models.json
+++ b/ai-provider/local/models.json
@@ -10703,7 +10703,7 @@
{
"id": "llava",
"name": "llava",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "8dd30f6b0cb1",
"provider": "",
@@ -10713,7 +10713,7 @@
{
"id": "llava:7b",
"name": "llava:7b",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "8dd30f6b0cb1",
"provider": "",
@@ -10723,7 +10723,7 @@
{
"id": "llava:13b",
"name": "llava:13b",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.0GB",
"digest": "0d0eb4d7f485",
"provider": "",
@@ -10733,7 +10733,7 @@
{
"id": "llava:34b",
"name": "llava:34b",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "20GB",
"digest": "3d2d24f46674",
"provider": "",
@@ -10743,7 +10743,7 @@
{
"id": "llava:13b-v1.5-fp16",
"name": "llava:13b-v1.5-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "27GB",
"digest": "ce3bde71eaa7",
"provider": "",
@@ -10753,7 +10753,7 @@
{
"id": "llava:13b-v1.5-q2_K",
"name": "llava:13b-v1.5-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.1GB",
"digest": "3cdd3869f154",
"provider": "",
@@ -10763,7 +10763,7 @@
{
"id": "llava:13b-v1.5-q3_K_L",
"name": "llava:13b-v1.5-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.6GB",
"digest": "07b1b74ec398",
"provider": "",
@@ -10773,7 +10773,7 @@
{
"id": "llava:13b-v1.5-q3_K_M",
"name": "llava:13b-v1.5-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.0GB",
"digest": "61441e82808c",
"provider": "",
@@ -10783,7 +10783,7 @@
{
"id": "llava:13b-v1.5-q3_K_S",
"name": "llava:13b-v1.5-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.3GB",
"digest": "c860f869008d",
"provider": "",
@@ -10793,7 +10793,7 @@
{
"id": "llava:13b-v1.5-q4_0",
"name": "llava:13b-v1.5-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.0GB",
"digest": "e3b7997801dc",
"provider": "",
@@ -10803,7 +10803,7 @@
{
"id": "llava:13b-v1.5-q4_1",
"name": "llava:13b-v1.5-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.8GB",
"digest": "0ca30ff66062",
"provider": "",
@@ -10813,7 +10813,7 @@
{
"id": "llava:13b-v1.5-q4_K_M",
"name": "llava:13b-v1.5-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.5GB",
"digest": "d0a6a3f0e6c4",
"provider": "",
@@ -10823,7 +10823,7 @@
{
"id": "llava:13b-v1.5-q4_K_S",
"name": "llava:13b-v1.5-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.1GB",
"digest": "16939c152bd9",
"provider": "",
@@ -10833,7 +10833,7 @@
{
"id": "llava:13b-v1.5-q5_0",
"name": "llava:13b-v1.5-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.6GB",
"digest": "78e17026912a",
"provider": "",
@@ -10843,7 +10843,7 @@
{
"id": "llava:13b-v1.5-q5_1",
"name": "llava:13b-v1.5-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "10GB",
"digest": "b11f33bc65fa",
"provider": "",
@@ -10853,7 +10853,7 @@
{
"id": "llava:13b-v1.5-q5_K_M",
"name": "llava:13b-v1.5-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.9GB",
"digest": "48418b116e18",
"provider": "",
@@ -10863,7 +10863,7 @@
{
"id": "llava:13b-v1.5-q5_K_S",
"name": "llava:13b-v1.5-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.6GB",
"digest": "c7f4b8076a0e",
"provider": "",
@@ -10873,7 +10873,7 @@
{
"id": "llava:13b-v1.5-q6_K",
"name": "llava:13b-v1.5-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "11GB",
"digest": "3c085b55f924",
"provider": "",
@@ -10883,7 +10883,7 @@
{
"id": "llava:13b-v1.5-q8_0",
"name": "llava:13b-v1.5-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "14GB",
"digest": "4e00c435bb25",
"provider": "",
@@ -10893,7 +10893,7 @@
{
"id": "llava:13b-v1.6",
"name": "llava:13b-v1.6",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.0GB",
"digest": "0d0eb4d7f485",
"provider": "",
@@ -10903,7 +10903,7 @@
{
"id": "llava:13b-v1.6-vicuna-fp16",
"name": "llava:13b-v1.6-vicuna-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "27GB",
"digest": "81e28406a4e9",
"provider": "",
@@ -10913,7 +10913,7 @@
{
"id": "llava:13b-v1.6-vicuna-q2_K",
"name": "llava:13b-v1.6-vicuna-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.5GB",
"digest": "87aecb135e2a",
"provider": "",
@@ -10923,7 +10923,7 @@
{
"id": "llava:13b-v1.6-vicuna-q3_K_L",
"name": "llava:13b-v1.6-vicuna-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.6GB",
"digest": "a2b56a2b8e79",
"provider": "",
@@ -10933,7 +10933,7 @@
{
"id": "llava:13b-v1.6-vicuna-q3_K_M",
"name": "llava:13b-v1.6-vicuna-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.0GB",
"digest": "2e48f094b51a",
"provider": "",
@@ -10943,7 +10943,7 @@
{
"id": "llava:13b-v1.6-vicuna-q3_K_S",
"name": "llava:13b-v1.6-vicuna-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.3GB",
"digest": "54ef03322645",
"provider": "",
@@ -10953,7 +10953,7 @@
{
"id": "llava:13b-v1.6-vicuna-q4_0",
"name": "llava:13b-v1.6-vicuna-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.0GB",
"digest": "0d0eb4d7f485",
"provider": "",
@@ -10963,7 +10963,7 @@
{
"id": "llava:13b-v1.6-vicuna-q4_1",
"name": "llava:13b-v1.6-vicuna-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.8GB",
"digest": "0b97528b26b0",
"provider": "",
@@ -10973,7 +10973,7 @@
{
"id": "llava:13b-v1.6-vicuna-q4_K_M",
"name": "llava:13b-v1.6-vicuna-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.5GB",
"digest": "0843119c3874",
"provider": "",
@@ -10983,7 +10983,7 @@
{
"id": "llava:13b-v1.6-vicuna-q4_K_S",
"name": "llava:13b-v1.6-vicuna-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.1GB",
"digest": "5e4cf96dfc4c",
"provider": "",
@@ -10993,7 +10993,7 @@
{
"id": "llava:13b-v1.6-vicuna-q5_0",
"name": "llava:13b-v1.6-vicuna-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.6GB",
"digest": "6e06e1393058",
"provider": "",
@@ -11003,7 +11003,7 @@
{
"id": "llava:13b-v1.6-vicuna-q5_1",
"name": "llava:13b-v1.6-vicuna-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "10GB",
"digest": "31f1d78cb272",
"provider": "",
@@ -11013,7 +11013,7 @@
{
"id": "llava:13b-v1.6-vicuna-q5_K_M",
"name": "llava:13b-v1.6-vicuna-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.9GB",
"digest": "446b10458a6a",
"provider": "",
@@ -11023,7 +11023,7 @@
{
"id": "llava:13b-v1.6-vicuna-q5_K_S",
"name": "llava:13b-v1.6-vicuna-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "9.6GB",
"digest": "53999e2c86c8",
"provider": "",
@@ -11033,7 +11033,7 @@
{
"id": "llava:13b-v1.6-vicuna-q6_K",
"name": "llava:13b-v1.6-vicuna-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "11GB",
"digest": "1c0a91e1e4d9",
"provider": "",
@@ -11043,7 +11043,7 @@
{
"id": "llava:13b-v1.6-vicuna-q8_0",
"name": "llava:13b-v1.6-vicuna-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "14GB",
"digest": "b25c4195f9e2",
"provider": "",
@@ -11053,7 +11053,7 @@
{
"id": "llava:34b-v1.6",
"name": "llava:34b-v1.6",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "20GB",
"digest": "3d2d24f46674",
"provider": "",
@@ -11063,7 +11063,7 @@
{
"id": "llava:34b-v1.6-fp16",
"name": "llava:34b-v1.6-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "69GB",
"digest": "89c50af82d5e",
"provider": "",
@@ -11073,7 +11073,7 @@
{
"id": "llava:34b-v1.6-q2_K",
"name": "llava:34b-v1.6-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "14GB",
"digest": "6326f59da4f1",
"provider": "",
@@ -11083,7 +11083,7 @@
{
"id": "llava:34b-v1.6-q3_K_L",
"name": "llava:34b-v1.6-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "19GB",
"digest": "7f9889648d1a",
"provider": "",
@@ -11093,7 +11093,7 @@
{
"id": "llava:34b-v1.6-q3_K_M",
"name": "llava:34b-v1.6-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "17GB",
"digest": "89e924fed7d4",
"provider": "",
@@ -11103,7 +11103,7 @@
{
"id": "llava:34b-v1.6-q3_K_S",
"name": "llava:34b-v1.6-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "16GB",
"digest": "a0376a205682",
"provider": "",
@@ -11113,7 +11113,7 @@
{
"id": "llava:34b-v1.6-q4_0",
"name": "llava:34b-v1.6-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "20GB",
"digest": "3d2d24f46674",
"provider": "",
@@ -11123,7 +11123,7 @@
{
"id": "llava:34b-v1.6-q4_1",
"name": "llava:34b-v1.6-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "22GB",
"digest": "96d20de28a1a",
"provider": "",
@@ -11133,7 +11133,7 @@
{
"id": "llava:34b-v1.6-q4_K_M",
"name": "llava:34b-v1.6-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "21GB",
"digest": "538ff4c5a8b8",
"provider": "",
@@ -11143,7 +11143,7 @@
{
"id": "llava:34b-v1.6-q4_K_S",
"name": "llava:34b-v1.6-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "20GB",
"digest": "787b2213f0db",
"provider": "",
@@ -11153,7 +11153,7 @@
{
"id": "llava:34b-v1.6-q5_0",
"name": "llava:34b-v1.6-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "24GB",
"digest": "b239e218bdf0",
"provider": "",
@@ -11163,7 +11163,7 @@
{
"id": "llava:34b-v1.6-q5_1",
"name": "llava:34b-v1.6-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "27GB",
"digest": "60926fd725ec",
"provider": "",
@@ -11173,7 +11173,7 @@
{
"id": "llava:34b-v1.6-q5_K_M",
"name": "llava:34b-v1.6-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "25GB",
"digest": "0eb2ab10d35c",
"provider": "",
@@ -11183,7 +11183,7 @@
{
"id": "llava:34b-v1.6-q5_K_S",
"name": "llava:34b-v1.6-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "24GB",
"digest": "cdd8d5db3870",
"provider": "",
@@ -11193,7 +11193,7 @@
{
"id": "llava:34b-v1.6-q6_K",
"name": "llava:34b-v1.6-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "29GB",
"digest": "8f572ea02185",
"provider": "",
@@ -11203,7 +11203,7 @@
{
"id": "llava:34b-v1.6-q8_0",
"name": "llava:34b-v1.6-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "37GB",
"digest": "959065f30849",
"provider": "",
@@ -11213,7 +11213,7 @@
{
"id": "llava:7b-v1.5-fp16",
"name": "llava:7b-v1.5-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "14GB",
"digest": "337a5b25bada",
"provider": "",
@@ -11223,7 +11223,7 @@
{
"id": "llava:7b-v1.5-q2_K",
"name": "llava:7b-v1.5-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.5GB",
"digest": "33973d2589d1",
"provider": "",
@@ -11233,7 +11233,7 @@
{
"id": "llava:7b-v1.5-q3_K_L",
"name": "llava:7b-v1.5-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.2GB",
"digest": "057fefd59cdb",
"provider": "",
@@ -11243,7 +11243,7 @@
{
"id": "llava:7b-v1.5-q3_K_M",
"name": "llava:7b-v1.5-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.9GB",
"digest": "9d738df24288",
"provider": "",
@@ -11253,7 +11253,7 @@
{
"id": "llava:7b-v1.5-q3_K_S",
"name": "llava:7b-v1.5-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.6GB",
"digest": "605b68e0b568",
"provider": "",
@@ -11263,7 +11263,7 @@
{
"id": "llava:7b-v1.5-q4_0",
"name": "llava:7b-v1.5-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.5GB",
"digest": "cd3274b81a85",
"provider": "",
@@ -11273,7 +11273,7 @@
{
"id": "llava:7b-v1.5-q4_1",
"name": "llava:7b-v1.5-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.9GB",
"digest": "146a55d9df75",
"provider": "",
@@ -11283,7 +11283,7 @@
{
"id": "llava:7b-v1.5-q4_K_M",
"name": "llava:7b-v1.5-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "75a9333e75cd",
"provider": "",
@@ -11293,7 +11293,7 @@
{
"id": "llava:7b-v1.5-q4_K_S",
"name": "llava:7b-v1.5-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.5GB",
"digest": "d8d545afa5f0",
"provider": "",
@@ -11303,7 +11303,7 @@
{
"id": "llava:7b-v1.5-q5_0",
"name": "llava:7b-v1.5-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.3GB",
"digest": "339249626980",
"provider": "",
@@ -11313,7 +11313,7 @@
{
"id": "llava:7b-v1.5-q5_1",
"name": "llava:7b-v1.5-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.7GB",
"digest": "6d97e8715c53",
"provider": "",
@@ -11323,7 +11323,7 @@
{
"id": "llava:7b-v1.5-q5_K_M",
"name": "llava:7b-v1.5-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.4GB",
"digest": "4fb097b9cfa3",
"provider": "",
@@ -11333,7 +11333,7 @@
{
"id": "llava:7b-v1.5-q5_K_S",
"name": "llava:7b-v1.5-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.3GB",
"digest": "34f9b24f2315",
"provider": "",
@@ -11343,7 +11343,7 @@
{
"id": "llava:7b-v1.5-q6_K",
"name": "llava:7b-v1.5-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.2GB",
"digest": "df0203e92f79",
"provider": "",
@@ -11353,7 +11353,7 @@
{
"id": "llava:7b-v1.5-q8_0",
"name": "llava:7b-v1.5-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.8GB",
"digest": "c684b68b3f34",
"provider": "",
@@ -11363,7 +11363,7 @@
{
"id": "llava:7b-v1.6",
"name": "llava:7b-v1.6",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "8dd30f6b0cb1",
"provider": "",
@@ -11373,7 +11373,7 @@
{
"id": "llava:7b-v1.6-mistral-fp16",
"name": "llava:7b-v1.6-mistral-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "15GB",
"digest": "9fd1e5417c5f",
"provider": "",
@@ -11383,7 +11383,7 @@
{
"id": "llava:7b-v1.6-mistral-q2_K",
"name": "llava:7b-v1.6-mistral-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.3GB",
"digest": "52e0ce44a5f5",
"provider": "",
@@ -11393,7 +11393,7 @@
{
"id": "llava:7b-v1.6-mistral-q3_K_L",
"name": "llava:7b-v1.6-mistral-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.4GB",
"digest": "a48bbc9b567b",
"provider": "",
@@ -11403,7 +11403,7 @@
{
"id": "llava:7b-v1.6-mistral-q3_K_M",
"name": "llava:7b-v1.6-mistral-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.1GB",
"digest": "25a00600f8b4",
"provider": "",
@@ -11413,7 +11413,7 @@
{
"id": "llava:7b-v1.6-mistral-q3_K_S",
"name": "llava:7b-v1.6-mistral-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.8GB",
"digest": "2b9c055fe6a2",
"provider": "",
@@ -11423,7 +11423,7 @@
{
"id": "llava:7b-v1.6-mistral-q4_0",
"name": "llava:7b-v1.6-mistral-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "8dd30f6b0cb1",
"provider": "",
@@ -11433,7 +11433,7 @@
{
"id": "llava:7b-v1.6-mistral-q4_1",
"name": "llava:7b-v1.6-mistral-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.2GB",
"digest": "8da3213068e6",
"provider": "",
@@ -11443,7 +11443,7 @@
{
"id": "llava:7b-v1.6-mistral-q4_K_M",
"name": "llava:7b-v1.6-mistral-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.0GB",
"digest": "8d3fbd6ad3f4",
"provider": "",
@@ -11453,7 +11453,7 @@
{
"id": "llava:7b-v1.6-mistral-q4_K_S",
"name": "llava:7b-v1.6-mistral-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.8GB",
"digest": "2878e8c79f6e",
"provider": "",
@@ -11463,7 +11463,7 @@
{
"id": "llava:7b-v1.6-mistral-q5_0",
"name": "llava:7b-v1.6-mistral-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.6GB",
"digest": "b8f63553f521",
"provider": "",
@@ -11473,7 +11473,7 @@
{
"id": "llava:7b-v1.6-mistral-q5_1",
"name": "llava:7b-v1.6-mistral-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.1GB",
"digest": "eda0b3f3b09b",
"provider": "",
@@ -11483,7 +11483,7 @@
{
"id": "llava:7b-v1.6-mistral-q5_K_M",
"name": "llava:7b-v1.6-mistral-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.8GB",
"digest": "244b7e3d3d5a",
"provider": "",
@@ -11493,7 +11493,7 @@
{
"id": "llava:7b-v1.6-mistral-q5_K_S",
"name": "llava:7b-v1.6-mistral-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.6GB",
"digest": "62dc434a7ae8",
"provider": "",
@@ -11503,7 +11503,7 @@
{
"id": "llava:7b-v1.6-mistral-q6_K",
"name": "llava:7b-v1.6-mistral-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.6GB",
"digest": "8781169d7f8f",
"provider": "",
@@ -11513,7 +11513,7 @@
{
"id": "llava:7b-v1.6-mistral-q8_0",
"name": "llava:7b-v1.6-mistral-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "8.3GB",
"digest": "c2973e390e84",
"provider": "",
@@ -11523,7 +11523,7 @@
{
"id": "llava:7b-v1.6-vicuna-fp16",
"name": "llava:7b-v1.6-vicuna-fp16",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "14GB",
"digest": "bb8da134bacb",
"provider": "",
@@ -11533,7 +11533,7 @@
{
"id": "llava:7b-v1.6-vicuna-q2_K",
"name": "llava:7b-v1.6-vicuna-q2_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.2GB",
"digest": "6321163f3833",
"provider": "",
@@ -11543,7 +11543,7 @@
{
"id": "llava:7b-v1.6-vicuna-q3_K_L",
"name": "llava:7b-v1.6-vicuna-q3_K_L",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.2GB",
"digest": "0127d9087e07",
"provider": "",
@@ -11553,7 +11553,7 @@
{
"id": "llava:7b-v1.6-vicuna-q3_K_M",
"name": "llava:7b-v1.6-vicuna-q3_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.9GB",
"digest": "7004e1f24eb1",
"provider": "",
@@ -11563,7 +11563,7 @@
{
"id": "llava:7b-v1.6-vicuna-q3_K_S",
"name": "llava:7b-v1.6-vicuna-q3_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "3.6GB",
"digest": "7701df672950",
"provider": "",
@@ -11573,7 +11573,7 @@
{
"id": "llava:7b-v1.6-vicuna-q4_0",
"name": "llava:7b-v1.6-vicuna-q4_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.5GB",
"digest": "b6cbe07f1d5e",
"provider": "",
@@ -11583,7 +11583,7 @@
{
"id": "llava:7b-v1.6-vicuna-q4_1",
"name": "llava:7b-v1.6-vicuna-q4_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.9GB",
"digest": "f8a27e237e97",
"provider": "",
@@ -11593,7 +11593,7 @@
{
"id": "llava:7b-v1.6-vicuna-q4_K_M",
"name": "llava:7b-v1.6-vicuna-q4_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "15360a9e0fb9",
"provider": "",
@@ -11603,7 +11603,7 @@
{
"id": "llava:7b-v1.6-vicuna-q4_K_S",
"name": "llava:7b-v1.6-vicuna-q4_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.5GB",
"digest": "5006a8a41d2b",
"provider": "",
@@ -11613,7 +11613,7 @@
{
"id": "llava:7b-v1.6-vicuna-q5_0",
"name": "llava:7b-v1.6-vicuna-q5_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.3GB",
"digest": "6a2bb61a611a",
"provider": "",
@@ -11623,7 +11623,7 @@
{
"id": "llava:7b-v1.6-vicuna-q5_1",
"name": "llava:7b-v1.6-vicuna-q5_1",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.7GB",
"digest": "1bd37032ec33",
"provider": "",
@@ -11633,7 +11633,7 @@
{
"id": "llava:7b-v1.6-vicuna-q5_K_M",
"name": "llava:7b-v1.6-vicuna-q5_K_M",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.4GB",
"digest": "b22b0c041223",
"provider": "",
@@ -11643,7 +11643,7 @@
{
"id": "llava:7b-v1.6-vicuna-q5_K_S",
"name": "llava:7b-v1.6-vicuna-q5_K_S",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "5.3GB",
"digest": "4aaa19502e34",
"provider": "",
@@ -11653,7 +11653,7 @@
{
"id": "llava:7b-v1.6-vicuna-q6_K",
"name": "llava:7b-v1.6-vicuna-q6_K",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "6.2GB",
"digest": "11bd55683f9c",
"provider": "",
@@ -11663,7 +11663,7 @@
{
"id": "llava:7b-v1.6-vicuna-q8_0",
"name": "llava:7b-v1.6-vicuna-q8_0",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "7.8GB",
"digest": "6da20a71d9bb",
"provider": "",
@@ -11673,7 +11673,7 @@
{
"id": "llava:v1.6",
"name": "llava:v1.6",
- "description": "🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
+ "description": "LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6.",
"size": "4.7GB",
"digest": "8dd30f6b0cb1",
"provider": "",
@@ -35753,7 +35753,7 @@
{
"id": "smollm",
"name": "smollm",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "991MB",
"digest": "95f6557a0f0f",
"provider": "",
@@ -35763,7 +35763,7 @@
{
"id": "smollm:135m",
"name": "smollm:135m",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "92MB",
"digest": "b0b2a4617438",
"provider": "",
@@ -35773,7 +35773,7 @@
{
"id": "smollm:360m",
"name": "smollm:360m",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "229MB",
"digest": "b3ba1ccba2b8",
"provider": "",
@@ -35783,7 +35783,7 @@
{
"id": "smollm:1.7b",
"name": "smollm:1.7b",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "991MB",
"digest": "95f6557a0f0f",
"provider": "",
@@ -35793,7 +35793,7 @@
{
"id": "smollm:1.7b-base-v0.2-fp16",
"name": "smollm:1.7b-base-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "3.4GB",
"digest": "64f31ee84d1c",
"provider": "",
@@ -35803,7 +35803,7 @@
{
"id": "smollm:1.7b-base-v0.2-q2_K",
"name": "smollm:1.7b-base-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "675MB",
"digest": "b013da007877",
"provider": "",
@@ -35813,7 +35813,7 @@
{
"id": "smollm:1.7b-base-v0.2-q3_K_L",
"name": "smollm:1.7b-base-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "933MB",
"digest": "9656463272fe",
"provider": "",
@@ -35823,7 +35823,7 @@
{
"id": "smollm:1.7b-base-v0.2-q3_K_M",
"name": "smollm:1.7b-base-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "860MB",
"digest": "9acc25818892",
"provider": "",
@@ -35833,7 +35833,7 @@
{
"id": "smollm:1.7b-base-v0.2-q3_K_S",
"name": "smollm:1.7b-base-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "777MB",
"digest": "596523cb1def",
"provider": "",
@@ -35843,7 +35843,7 @@
{
"id": "smollm:1.7b-base-v0.2-q4_0",
"name": "smollm:1.7b-base-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "991MB",
"digest": "97f3f0aef2df",
"provider": "",
@@ -35853,7 +35853,7 @@
{
"id": "smollm:1.7b-base-v0.2-q4_1",
"name": "smollm:1.7b-base-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.1GB",
"digest": "0c1bb3471f92",
"provider": "",
@@ -35863,7 +35863,7 @@
{
"id": "smollm:1.7b-base-v0.2-q4_K_M",
"name": "smollm:1.7b-base-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.1GB",
"digest": "8dec12ffec4a",
"provider": "",
@@ -35873,7 +35873,7 @@
{
"id": "smollm:1.7b-base-v0.2-q4_K_S",
"name": "smollm:1.7b-base-v0.2-q4_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "999MB",
"digest": "9b3d36b6e0c2",
"provider": "",
@@ -35883,7 +35883,7 @@
{
"id": "smollm:1.7b-base-v0.2-q5_0",
"name": "smollm:1.7b-base-v0.2-q5_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "7eddfb294e53",
"provider": "",
@@ -35893,7 +35893,7 @@
{
"id": "smollm:1.7b-base-v0.2-q5_1",
"name": "smollm:1.7b-base-v0.2-q5_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.3GB",
"digest": "fde4c91abcce",
"provider": "",
@@ -35903,7 +35903,7 @@
{
"id": "smollm:1.7b-base-v0.2-q5_K_M",
"name": "smollm:1.7b-base-v0.2-q5_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "7daaf6f561d8",
"provider": "",
@@ -35913,7 +35913,7 @@
{
"id": "smollm:1.7b-base-v0.2-q5_K_S",
"name": "smollm:1.7b-base-v0.2-q5_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "4f0e5ec42d5b",
"provider": "",
@@ -35923,7 +35923,7 @@
{
"id": "smollm:1.7b-base-v0.2-q6_K",
"name": "smollm:1.7b-base-v0.2-q6_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.4GB",
"digest": "9cf3be2645b6",
"provider": "",
@@ -35933,7 +35933,7 @@
{
"id": "smollm:1.7b-base-v0.2-q8_0",
"name": "smollm:1.7b-base-v0.2-q8_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.8GB",
"digest": "d1f91cd676ad",
"provider": "",
@@ -35943,7 +35943,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-fp16",
"name": "smollm:1.7b-instruct-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "3.4GB",
"digest": "b07e591ca9ba",
"provider": "",
@@ -35953,7 +35953,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q2_K",
"name": "smollm:1.7b-instruct-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "675MB",
"digest": "da8ba92e42b1",
"provider": "",
@@ -35963,7 +35963,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q3_K_L",
"name": "smollm:1.7b-instruct-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "933MB",
"digest": "88ef3062260e",
"provider": "",
@@ -35973,7 +35973,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q3_K_M",
"name": "smollm:1.7b-instruct-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "860MB",
"digest": "728c1f932b06",
"provider": "",
@@ -35983,7 +35983,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q3_K_S",
"name": "smollm:1.7b-instruct-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "777MB",
"digest": "c35438da7180",
"provider": "",
@@ -35993,7 +35993,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q4_0",
"name": "smollm:1.7b-instruct-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "991MB",
"digest": "95f6557a0f0f",
"provider": "",
@@ -36003,7 +36003,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q4_1",
"name": "smollm:1.7b-instruct-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.1GB",
"digest": "77d7238b232e",
"provider": "",
@@ -36013,7 +36013,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q4_K_M",
"name": "smollm:1.7b-instruct-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.1GB",
"digest": "dd7299829a14",
"provider": "",
@@ -36023,7 +36023,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q4_K_S",
"name": "smollm:1.7b-instruct-v0.2-q4_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "999MB",
"digest": "35eec1a7014d",
"provider": "",
@@ -36033,7 +36033,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q5_0",
"name": "smollm:1.7b-instruct-v0.2-q5_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "8391060f29db",
"provider": "",
@@ -36043,7 +36043,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q5_1",
"name": "smollm:1.7b-instruct-v0.2-q5_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.3GB",
"digest": "ce91dd1d7380",
"provider": "",
@@ -36053,7 +36053,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q5_K_M",
"name": "smollm:1.7b-instruct-v0.2-q5_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "91d16f72a7b3",
"provider": "",
@@ -36063,7 +36063,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q5_K_S",
"name": "smollm:1.7b-instruct-v0.2-q5_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.2GB",
"digest": "489a893ac8a7",
"provider": "",
@@ -36073,7 +36073,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q6_K",
"name": "smollm:1.7b-instruct-v0.2-q6_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.4GB",
"digest": "ecdf9864899c",
"provider": "",
@@ -36083,7 +36083,7 @@
{
"id": "smollm:1.7b-instruct-v0.2-q8_0",
"name": "smollm:1.7b-instruct-v0.2-q8_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "1.8GB",
"digest": "4afeb8de9eec",
"provider": "",
@@ -36093,7 +36093,7 @@
{
"id": "smollm:135m-base-v0.2-fp16",
"name": "smollm:135m-base-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "271MB",
"digest": "1d0f00cec918",
"provider": "",
@@ -36103,7 +36103,7 @@
{
"id": "smollm:135m-base-v0.2-q2_K",
"name": "smollm:135m-base-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "88MB",
"digest": "e2048e8ac78d",
"provider": "",
@@ -36113,7 +36113,7 @@
{
"id": "smollm:135m-base-v0.2-q3_K_L",
"name": "smollm:135m-base-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "98MB",
"digest": "c2e22813067a",
"provider": "",
@@ -36123,7 +36123,7 @@
{
"id": "smollm:135m-base-v0.2-q3_K_M",
"name": "smollm:135m-base-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "94MB",
"digest": "a5ab45ae2e2e",
"provider": "",
@@ -36133,7 +36133,7 @@
{
"id": "smollm:135m-base-v0.2-q3_K_S",
"name": "smollm:135m-base-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "88MB",
"digest": "102433ffd9fb",
"provider": "",
@@ -36143,7 +36143,7 @@
{
"id": "smollm:135m-base-v0.2-q4_0",
"name": "smollm:135m-base-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "92MB",
"digest": "528415e872e5",
"provider": "",
@@ -36153,7 +36153,7 @@
{
"id": "smollm:135m-base-v0.2-q4_1",
"name": "smollm:135m-base-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "98MB",
"digest": "edecca7cff90",
"provider": "",
@@ -36163,7 +36163,7 @@
{
"id": "smollm:135m-base-v0.2-q4_K_M",
"name": "smollm:135m-base-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "105MB",
"digest": "3177ecf5d3b5",
"provider": "",
@@ -36173,7 +36173,7 @@
{
"id": "smollm:135m-base-v0.2-q4_K_S",
"name": "smollm:135m-base-v0.2-q4_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "102MB",
"digest": "2aa760d22716",
"provider": "",
@@ -36183,7 +36183,7 @@
{
"id": "smollm:135m-base-v0.2-q5_0",
"name": "smollm:135m-base-v0.2-q5_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "105MB",
"digest": "825973a56945",
"provider": "",
@@ -36193,7 +36193,7 @@
{
"id": "smollm:135m-base-v0.2-q5_1",
"name": "smollm:135m-base-v0.2-q5_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "112MB",
"digest": "065d585f86d9",
"provider": "",
@@ -36203,7 +36203,7 @@
{
"id": "smollm:135m-base-v0.2-q5_K_M",
"name": "smollm:135m-base-v0.2-q5_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "112MB",
"digest": "34545da0aa92",
"provider": "",
@@ -36213,7 +36213,7 @@
{
"id": "smollm:135m-base-v0.2-q5_K_S",
"name": "smollm:135m-base-v0.2-q5_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "110MB",
"digest": "4aef8aaa4469",
"provider": "",
@@ -36223,7 +36223,7 @@
{
"id": "smollm:135m-base-v0.2-q6_K",
"name": "smollm:135m-base-v0.2-q6_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "138MB",
"digest": "b11338fff65a",
"provider": "",
@@ -36233,7 +36233,7 @@
{
"id": "smollm:135m-base-v0.2-q8_0",
"name": "smollm:135m-base-v0.2-q8_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "145MB",
"digest": "fcdc33f9909d",
"provider": "",
@@ -36243,7 +36243,7 @@
{
"id": "smollm:135m-instruct-v0.2-fp16",
"name": "smollm:135m-instruct-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "271MB",
"digest": "95d01a081beb",
"provider": "",
@@ -36253,7 +36253,7 @@
{
"id": "smollm:135m-instruct-v0.2-q2_K",
"name": "smollm:135m-instruct-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "88MB",
"digest": "e14a680b0b22",
"provider": "",
@@ -36263,7 +36263,7 @@
{
"id": "smollm:135m-instruct-v0.2-q3_K_L",
"name": "smollm:135m-instruct-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "98MB",
"digest": "aede666c7e16",
"provider": "",
@@ -36273,7 +36273,7 @@
{
"id": "smollm:135m-instruct-v0.2-q3_K_M",
"name": "smollm:135m-instruct-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "94MB",
"digest": "f5db1ab329b1",
"provider": "",
@@ -36283,7 +36283,7 @@
{
"id": "smollm:135m-instruct-v0.2-q3_K_S",
"name": "smollm:135m-instruct-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "88MB",
"digest": "3ae895b5e9ea",
"provider": "",
@@ -36293,7 +36293,7 @@
{
"id": "smollm:135m-instruct-v0.2-q4_0",
"name": "smollm:135m-instruct-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "92MB",
"digest": "b0b2a4617438",
"provider": "",
@@ -36303,7 +36303,7 @@
{
"id": "smollm:135m-instruct-v0.2-q4_1",
"name": "smollm:135m-instruct-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "98MB",
"digest": "bbf7e14150a9",
"provider": "",
@@ -36313,7 +36313,7 @@
{
"id": "smollm:135m-instruct-v0.2-q4_K_M",
"name": "smollm:135m-instruct-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "105MB",
"digest": "7eedbf45baa1",
"provider": "",
@@ -36323,7 +36323,7 @@
{
"id": "smollm:135m-instruct-v0.2-q4_K_S",
"name": "smollm:135m-instruct-v0.2-q4_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "102MB",
"digest": "45013939c7c9",
"provider": "",
@@ -36333,7 +36333,7 @@
{
"id": "smollm:135m-instruct-v0.2-q5_0",
"name": "smollm:135m-instruct-v0.2-q5_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "105MB",
"digest": "33187e134422",
"provider": "",
@@ -36343,7 +36343,7 @@
{
"id": "smollm:135m-instruct-v0.2-q5_1",
"name": "smollm:135m-instruct-v0.2-q5_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "112MB",
"digest": "51f73e9aa3f5",
"provider": "",
@@ -36353,7 +36353,7 @@
{
"id": "smollm:135m-instruct-v0.2-q5_K_M",
"name": "smollm:135m-instruct-v0.2-q5_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "112MB",
"digest": "a8975f4dc03b",
"provider": "",
@@ -36363,7 +36363,7 @@
{
"id": "smollm:135m-instruct-v0.2-q5_K_S",
"name": "smollm:135m-instruct-v0.2-q5_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "110MB",
"digest": "52d3fabb63ee",
"provider": "",
@@ -36373,7 +36373,7 @@
{
"id": "smollm:135m-instruct-v0.2-q6_K",
"name": "smollm:135m-instruct-v0.2-q6_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "138MB",
"digest": "dd1e60cf54df",
"provider": "",
@@ -36383,7 +36383,7 @@
{
"id": "smollm:135m-instruct-v0.2-q8_0",
"name": "smollm:135m-instruct-v0.2-q8_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "145MB",
"digest": "6fbf8e918862",
"provider": "",
@@ -36393,7 +36393,7 @@
{
"id": "smollm:360m-base-v0.2-fp16",
"name": "smollm:360m-base-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "726MB",
"digest": "417c81308b94",
"provider": "",
@@ -36403,7 +36403,7 @@
{
"id": "smollm:360m-base-v0.2-q2_K",
"name": "smollm:360m-base-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "219MB",
"digest": "e5e1a58c7d0c",
"provider": "",
@@ -36413,7 +36413,7 @@
{
"id": "smollm:360m-base-v0.2-q3_K_L",
"name": "smollm:360m-base-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "246MB",
"digest": "d13db1d8af29",
"provider": "",
@@ -36423,7 +36423,7 @@
{
"id": "smollm:360m-base-v0.2-q3_K_M",
"name": "smollm:360m-base-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "235MB",
"digest": "66875ceb33a7",
"provider": "",
@@ -36433,7 +36433,7 @@
{
"id": "smollm:360m-base-v0.2-q3_K_S",
"name": "smollm:360m-base-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "219MB",
"digest": "8aba991b34bf",
"provider": "",
@@ -36443,7 +36443,7 @@
{
"id": "smollm:360m-base-v0.2-q4_0",
"name": "smollm:360m-base-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "229MB",
"digest": "32ed02cfe24e",
"provider": "",
@@ -36453,7 +36453,7 @@
{
"id": "smollm:360m-base-v0.2-q4_1",
"name": "smollm:360m-base-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "249MB",
"digest": "74c8ae01b04d",
"provider": "",
@@ -36463,7 +36463,7 @@
{
"id": "smollm:360m-base-v0.2-q4_K_M",
"name": "smollm:360m-base-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "271MB",
"digest": "d3b4961678c3",
"provider": "",
@@ -36473,7 +36473,7 @@
{
"id": "smollm:360m-base-v0.2-q4_K_S",
"name": "smollm:360m-base-v0.2-q4_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "260MB",
"digest": "81b950fac810",
"provider": "",
@@ -36483,7 +36483,7 @@
{
"id": "smollm:360m-base-v0.2-q5_0",
"name": "smollm:360m-base-v0.2-q5_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "268MB",
"digest": "319a822c1baa",
"provider": "",
@@ -36493,7 +36493,7 @@
{
"id": "smollm:360m-base-v0.2-q5_1",
"name": "smollm:360m-base-v0.2-q5_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "288MB",
"digest": "1c350d9f5c43",
"provider": "",
@@ -36503,7 +36503,7 @@
{
"id": "smollm:360m-base-v0.2-q5_K_M",
"name": "smollm:360m-base-v0.2-q5_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "290MB",
"digest": "bf2e3336142d",
"provider": "",
@@ -36513,7 +36513,7 @@
{
"id": "smollm:360m-base-v0.2-q5_K_S",
"name": "smollm:360m-base-v0.2-q5_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "283MB",
"digest": "05dad743d112",
"provider": "",
@@ -36523,7 +36523,7 @@
{
"id": "smollm:360m-base-v0.2-q6_K",
"name": "smollm:360m-base-v0.2-q6_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "367MB",
"digest": "6006320b3839",
"provider": "",
@@ -36533,7 +36533,7 @@
{
"id": "smollm:360m-base-v0.2-q8_0",
"name": "smollm:360m-base-v0.2-q8_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "386MB",
"digest": "dd417453fb49",
"provider": "",
@@ -36543,7 +36543,7 @@
{
"id": "smollm:360m-instruct-v0.2-fp16",
"name": "smollm:360m-instruct-v0.2-fp16",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "726MB",
"digest": "d0475be06ee3",
"provider": "",
@@ -36553,7 +36553,7 @@
{
"id": "smollm:360m-instruct-v0.2-q2_K",
"name": "smollm:360m-instruct-v0.2-q2_K",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "219MB",
"digest": "1dfe94149c4d",
"provider": "",
@@ -36563,7 +36563,7 @@
{
"id": "smollm:360m-instruct-v0.2-q3_K_L",
"name": "smollm:360m-instruct-v0.2-q3_K_L",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "246MB",
"digest": "6f711219bd5f",
"provider": "",
@@ -36573,7 +36573,7 @@
{
"id": "smollm:360m-instruct-v0.2-q3_K_M",
"name": "smollm:360m-instruct-v0.2-q3_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "235MB",
"digest": "4ecfcbc87975",
"provider": "",
@@ -36583,7 +36583,7 @@
{
"id": "smollm:360m-instruct-v0.2-q3_K_S",
"name": "smollm:360m-instruct-v0.2-q3_K_S",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "219MB",
"digest": "359f743b44a1",
"provider": "",
@@ -36593,7 +36593,7 @@
{
"id": "smollm:360m-instruct-v0.2-q4_0",
"name": "smollm:360m-instruct-v0.2-q4_0",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "229MB",
"digest": "b3ba1ccba2b8",
"provider": "",
@@ -36603,7 +36603,7 @@
{
"id": "smollm:360m-instruct-v0.2-q4_1",
"name": "smollm:360m-instruct-v0.2-q4_1",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "249MB",
"digest": "4a28c336aedd",
"provider": "",
@@ -36613,7 +36613,7 @@
{
"id": "smollm:360m-instruct-v0.2-q4_K_M",
"name": "smollm:360m-instruct-v0.2-q4_K_M",
- "description": "🪐 A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
+ "description": "A family of small models with 135M, 360M, and 1.7B parameters, trained on a new high-quality dataset.",
"size": "271MB",
"digest": "535cb302b6b9",
"provider": "",
@@ -43183,7 +43183,7 @@
{
"id": "dolphin3",
"name": "dolphin3",
- "description": "Dolphin 3.0 Llama 3.1 8B 🐬 is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
+ "description": "Dolphin 3.0 Llama 3.1 8B is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
"size": "4.9GB",
"digest": "d5ab9ae8e1f2",
"provider": "",
@@ -43193,7 +43193,7 @@
{
"id": "dolphin3:8b",
"name": "dolphin3:8b",
- "description": "Dolphin 3.0 Llama 3.1 8B 🐬 is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
+ "description": "Dolphin 3.0 Llama 3.1 8B is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
"size": "4.9GB",
"digest": "d5ab9ae8e1f2",
"provider": "",
@@ -43203,7 +43203,7 @@
{
"id": "dolphin3:8b-llama3.1-fp16",
"name": "dolphin3:8b-llama3.1-fp16",
- "description": "Dolphin 3.0 Llama 3.1 8B 🐬 is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
+ "description": "Dolphin 3.0 Llama 3.1 8B is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
"size": "16GB",
"digest": "b0941c6f3226",
"provider": "",
@@ -43213,7 +43213,7 @@
{
"id": "dolphin3:8b-llama3.1-q4_K_M",
"name": "dolphin3:8b-llama3.1-q4_K_M",
- "description": "Dolphin 3.0 Llama 3.1 8B 🐬 is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
+ "description": "Dolphin 3.0 Llama 3.1 8B is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
"size": "4.9GB",
"digest": "d5ab9ae8e1f2",
"provider": "",
@@ -43223,7 +43223,7 @@
{
"id": "dolphin3:8b-llama3.1-q8_0",
"name": "dolphin3:8b-llama3.1-q8_0",
- "description": "Dolphin 3.0 Llama 3.1 8B 🐬 is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
+ "description": "Dolphin 3.0 Llama 3.1 8B is the next generation of the Dolphin series of instruct-tuned models designed to be the ultimate general purpose local model, enabling coding, math, agentic, function calling, and general use cases.",
"size": "8.5GB",
"digest": "e3310b61ffdb",
"provider": "",
@@ -59063,7 +59063,7 @@
{
"id": "magicoder",
"name": "magicoder",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.8GB",
"digest": "8007de06f5d9",
"provider": "",
@@ -59073,7 +59073,7 @@
{
"id": "magicoder:7b",
"name": "magicoder:7b",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.8GB",
"digest": "8007de06f5d9",
"provider": "",
@@ -59083,7 +59083,7 @@
{
"id": "magicoder:7b-s-cl",
"name": "magicoder:7b-s-cl",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.8GB",
"digest": "8007de06f5d9",
"provider": "",
@@ -59093,7 +59093,7 @@
{
"id": "magicoder:7b-s-cl-fp16",
"name": "magicoder:7b-s-cl-fp16",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "13GB",
"digest": "859e1ae4f566",
"provider": "",
@@ -59103,7 +59103,7 @@
{
"id": "magicoder:7b-s-cl-q2_K",
"name": "magicoder:7b-s-cl-q2_K",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "2.8GB",
"digest": "86fd329c64b6",
"provider": "",
@@ -59113,7 +59113,7 @@
{
"id": "magicoder:7b-s-cl-q3_K_L",
"name": "magicoder:7b-s-cl-q3_K_L",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.6GB",
"digest": "2bf1232fd9c1",
"provider": "",
@@ -59123,7 +59123,7 @@
{
"id": "magicoder:7b-s-cl-q3_K_M",
"name": "magicoder:7b-s-cl-q3_K_M",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.3GB",
"digest": "b2a3d9987ff3",
"provider": "",
@@ -59133,7 +59133,7 @@
{
"id": "magicoder:7b-s-cl-q3_K_S",
"name": "magicoder:7b-s-cl-q3_K_S",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "2.9GB",
"digest": "b7e2d7a303f8",
"provider": "",
@@ -59143,7 +59143,7 @@
{
"id": "magicoder:7b-s-cl-q4_0",
"name": "magicoder:7b-s-cl-q4_0",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.8GB",
"digest": "8007de06f5d9",
"provider": "",
@@ -59153,7 +59153,7 @@
{
"id": "magicoder:7b-s-cl-q4_1",
"name": "magicoder:7b-s-cl-q4_1",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "4.2GB",
"digest": "b29bf322a686",
"provider": "",
@@ -59163,7 +59163,7 @@
{
"id": "magicoder:7b-s-cl-q4_K_M",
"name": "magicoder:7b-s-cl-q4_K_M",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "4.1GB",
"digest": "902b6b028113",
"provider": "",
@@ -59173,7 +59173,7 @@
{
"id": "magicoder:7b-s-cl-q4_K_S",
"name": "magicoder:7b-s-cl-q4_K_S",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "3.9GB",
"digest": "42b56dd9b1da",
"provider": "",
@@ -59183,7 +59183,7 @@
{
"id": "magicoder:7b-s-cl-q5_0",
"name": "magicoder:7b-s-cl-q5_0",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "4.7GB",
"digest": "10fa66c827ee",
"provider": "",
@@ -59193,7 +59193,7 @@
{
"id": "magicoder:7b-s-cl-q5_1",
"name": "magicoder:7b-s-cl-q5_1",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "5.1GB",
"digest": "7da1fdad5251",
"provider": "",
@@ -59203,7 +59203,7 @@
{
"id": "magicoder:7b-s-cl-q5_K_M",
"name": "magicoder:7b-s-cl-q5_K_M",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "4.8GB",
"digest": "057c4f587f41",
"provider": "",
@@ -59213,7 +59213,7 @@
{
"id": "magicoder:7b-s-cl-q5_K_S",
"name": "magicoder:7b-s-cl-q5_K_S",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "4.7GB",
"digest": "ce0b81d40da6",
"provider": "",
@@ -59223,7 +59223,7 @@
{
"id": "magicoder:7b-s-cl-q6_K",
"name": "magicoder:7b-s-cl-q6_K",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "5.5GB",
"digest": "cf853951ae4a",
"provider": "",
@@ -59233,7 +59233,7 @@
{
"id": "magicoder:7b-s-cl-q8_0",
"name": "magicoder:7b-s-cl-q8_0",
- "description": "🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
+ "description": "Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets.",
"size": "7.2GB",
"digest": "96b5e4193464",
"provider": "",
diff --git a/ai-provider/local/ollama.go b/ai-provider/local/ollama.go
deleted file mode 100644
index be765848..00000000
--- a/ai-provider/local/ollama.go
+++ /dev/null
@@ -1,102 +0,0 @@
-package ai_provider_local
-
-var (
- OllamaConfig = "{\n \"mirostat\": 0,\n \"mirostat_eta\": 0.1,\n \"mirostat_tau\": 5.0,\n \"num_ctx\": 4096,\n \"repeat_last_n\":64,\n \"repeat_penalty\": 1.1,\n \"temperature\": 0.7,\n \"seed\": 42,\n \"num_predict\": 42,\n \"top_k\": 40,\n \"top_p\": 0.9,\n \"min_p\": 0.5\n}\n"
- OllamaSvg = `
-
-
-`
-)
diff --git a/ai-provider/model-runtime/model-providers/authropic/anthropic.yaml b/ai-provider/model-runtime/model-providers/authropic/anthropic.yaml
index f44d3e18..7bcaf986 100644
--- a/ai-provider/model-runtime/model-providers/authropic/anthropic.yaml
+++ b/ai-provider/model-runtime/model-providers/authropic/anthropic.yaml
@@ -31,12 +31,12 @@ provider_credential_schema:
en_US: Enter your API Key
- variable: anthropic_api_url
label:
- en_US: API URL
+ en_US: https://api.anthropic.com/v1/
type: text-input
required: false
placeholder:
zh_Hans: 在此输入您的 API URL
en_US: Enter your API URL
-address: https://api.anthropic.com
+address: https://api.anthropic.com/v1/
recommend: true
sort: 2
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/baichuan/baichuan.yaml b/ai-provider/model-runtime/model-providers/baichuan/baichuan.yaml
index dcadb657..da814abd 100644
--- a/ai-provider/model-runtime/model-providers/baichuan/baichuan.yaml
+++ b/ai-provider/model-runtime/model-providers/baichuan/baichuan.yaml
@@ -27,4 +27,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.baichuan-ai.com
+ - variable: base_url
+ label:
+ en_US: https://api.baichuan-ai.com/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.baichuan-ai.com/v1
diff --git a/ai-provider/model-runtime/model-providers/bailian/bailian.yaml b/ai-provider/model-runtime/model-providers/bailian/bailian.yaml
index 7456a7de..93bd6a02 100644
--- a/ai-provider/model-runtime/model-providers/bailian/bailian.yaml
+++ b/ai-provider/model-runtime/model-providers/bailian/bailian.yaml
@@ -1,7 +1,7 @@
provider: bailian
label:
zh_Hans: 阿里云百炼
- en_US: bailian
+ en_US: BaiLian
icon_small:
en_US: icon_s_en.svg
icon_large:
@@ -21,7 +21,7 @@ configurate_methods:
- customizable-model
provider_credential_schema:
credential_form_schemas:
- - variable: dashscope_api_key
+ - variable: api_key
label:
en_US: API Key
type: secret-input
@@ -29,4 +29,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://dashscope.aliyuncs.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://dashscope.aliyuncs.com/compatible-mode/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://dashscope.aliyuncs.com/compatible-mode/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/bedrock/bedrock.yaml b/ai-provider/model-runtime/model-providers/bedrock/bedrock.yaml
index b9f165c2..f7332e40 100644
--- a/ai-provider/model-runtime/model-providers/bedrock/bedrock.yaml
+++ b/ai-provider/model-runtime/model-providers/bedrock/bedrock.yaml
@@ -87,6 +87,9 @@ provider_credential_schema:
placeholder:
en_US: A model you have access to (e.g. amazon.titan-text-lite-v1) for validation.
zh_Hans: 为了进行验证,请输入一个您可用的模型名称 (例如:amazon.titan-text-lite-v1)
+model_config:
+ access_configuration_status: true
+ access_configuration_demo: "{\"region\":\"\",\"model\":\"\"}"
address: https://bedrock-runtime.amazonaws.com
sort: 4
recommend: true
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/chatglm/chatglm.yaml b/ai-provider/model-runtime/model-providers/chatglm/chatglm.yaml
index 715febcd..25ee59f2 100644
--- a/ai-provider/model-runtime/model-providers/chatglm/chatglm.yaml
+++ b/ai-provider/model-runtime/model-providers/chatglm/chatglm.yaml
@@ -18,12 +18,20 @@ configurate_methods:
- predefined-model
provider_credential_schema:
credential_form_schemas:
- - variable: api_base
+ - variable: api_key
label:
- en_US: API URL
- type: text-input
+ en_US: API Key
+ type: secret-input
required: true
+ placeholder:
+ zh_Hans: 在此输入您的 API Key
+ en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://open.bigmodel.cn/api/paas/v4/
+ type: text-input
+ required: false
placeholder:
zh_Hans: 在此输入您的 API URL
en_US: Enter your API URL
-address: https://api.openai.com
\ No newline at end of file
+address: https://open.bigmodel.cn/api/paas/v4/
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/cohere/cohere.yaml b/ai-provider/model-runtime/model-providers/cohere/cohere.yaml
index fa6e0556..27419ba1 100644
--- a/ai-provider/model-runtime/model-providers/cohere/cohere.yaml
+++ b/ai-provider/model-runtime/model-providers/cohere/cohere.yaml
@@ -32,4 +32,12 @@ provider_credential_schema:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
show_on: [ ]
-address: https://api.cohere.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.cohere.ai/compatibility/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.cohere.ai/compatibility/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/deepseek/deepseek.yaml b/ai-provider/model-runtime/model-providers/deepseek/deepseek.yaml
index 6e1bf082..1aebab42 100644
--- a/ai-provider/model-runtime/model-providers/deepseek/deepseek.yaml
+++ b/ai-provider/model-runtime/model-providers/deepseek/deepseek.yaml
@@ -30,4 +30,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.deepseek.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.deepseek.com/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.deepseek.com/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/fireworks/fireworks.yaml b/ai-provider/model-runtime/model-providers/fireworks/fireworks.yaml
index be734ac4..c375b6f3 100644
--- a/ai-provider/model-runtime/model-providers/fireworks/fireworks.yaml
+++ b/ai-provider/model-runtime/model-providers/fireworks/fireworks.yaml
@@ -28,4 +28,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.fireworks.ai
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://generativelanguage.googleapis.com/v1beta/openai
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.fireworks.ai/inference/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/google/google.yaml b/ai-provider/model-runtime/model-providers/google/google.yaml
index e54c899f..afc731cf 100644
--- a/ai-provider/model-runtime/model-providers/google/google.yaml
+++ b/ai-provider/model-runtime/model-providers/google/google.yaml
@@ -32,12 +32,12 @@ provider_credential_schema:
- variable: google_api_base
label:
zh_Hans: API Base
- en_US: API Base
+ en_US: https://generativelanguage.googleapis.com/v1beta/openai
type: text-input
required: false
placeholder:
zh_Hans: 在此输入您的 API Base, 如:https://api.google.com
en_US: Enter your API Base, e.g. https://api.google.com
-address: https://generativelanguage.googleapis.com
+address: https://generativelanguage.googleapis.com/v1beta/openai
recommend: true
sort: 3
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/groq/groq.yaml b/ai-provider/model-runtime/model-providers/groq/groq.yaml
index b2ce06f8..697a4e10 100644
--- a/ai-provider/model-runtime/model-providers/groq/groq.yaml
+++ b/ai-provider/model-runtime/model-providers/groq/groq.yaml
@@ -30,4 +30,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.groq.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.groq.com/openai/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.groq.com/openai/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/huggingface_hub/huggingface_hub.yaml b/ai-provider/model-runtime/model-providers/huggingface_hub/huggingface_hub.yaml
index e51e6081..8605c82c 100644
--- a/ai-provider/model-runtime/model-providers/huggingface_hub/huggingface_hub.yaml
+++ b/ai-provider/model-runtime/model-providers/huggingface_hub/huggingface_hub.yaml
@@ -100,4 +100,22 @@ model_credential_schema:
show_on:
- variable: huggingfacehub_api_type
value: inference_endpoints
-address: https://api-inference.huggingface.co
\ No newline at end of file
+provider_credential_schema:
+ credential_form_schemas:
+ - variable: api_key
+ label:
+ en_US: API Key
+ type: secret-input
+ required: true
+ placeholder:
+ zh_Hans: 在此输入您的 API Key
+ en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://router.huggingface.co/hf-inference/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://router.huggingface.co/hf-inference/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/hunyuan/hunyuan.yaml b/ai-provider/model-runtime/model-providers/hunyuan/hunyuan.yaml
index 4b87e243..51a068dd 100644
--- a/ai-provider/model-runtime/model-providers/hunyuan/hunyuan.yaml
+++ b/ai-provider/model-runtime/model-providers/hunyuan/hunyuan.yaml
@@ -23,20 +23,36 @@ configurate_methods:
- predefined-model
provider_credential_schema:
credential_form_schemas:
- - variable: secret_id
+# - variable: secret_id
+# label:
+# en_US: Secret ID
+# type: secret-input
+# required: true
+# placeholder:
+# zh_Hans: 在此输入您的 Secret ID
+# en_US: Enter your Secret ID
+# - variable: secret_key
+# label:
+# en_US: Secret Key
+# type: secret-input
+# required: true
+# placeholder:
+# zh_Hans: 在此输入您的 Secret Key
+# en_US: Enter your Secret Key
+ - variable: api_key
label:
- en_US: Secret ID
+ en_US: API Key
type: secret-input
required: true
placeholder:
- zh_Hans: 在此输入您的 Secret ID
- en_US: Enter your Secret ID
- - variable: secret_key
+ zh_Hans: 在此输入您的 API Key
+ en_US: Enter your API Key
+ - variable: base_url
label:
- en_US: Secret Key
- type: secret-input
- required: true
+ en_US: https://api.hunyuan.cloud.tencent.com/v1
+ type: text-input
+ required: false
placeholder:
- zh_Hans: 在此输入您的 Secret Key
- en_US: Enter your Secret Key
-address: https://hunyuan.tencentcloudapi.com
\ No newline at end of file
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.hunyuan.cloud.tencent.com/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_l_en.svg b/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_l_en.svg
index f1ef8d4b..5f08476c 100644
--- a/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_l_en.svg
+++ b/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_l_en.svg
@@ -1,11 +1 @@
-
+
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_s_en.svg b/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_s_en.svg
index 86f2c419..5f08476c 100644
--- a/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_s_en.svg
+++ b/ai-provider/model-runtime/model-providers/lm_studio/assets/icon_s_en.svg
@@ -1,4 +1 @@
-
+
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/lm_studio/lm_studio.yaml b/ai-provider/model-runtime/model-providers/lm_studio/lm_studio.yaml
index 5e62cd11..1b3306bc 100644
--- a/ai-provider/model-runtime/model-providers/lm_studio/lm_studio.yaml
+++ b/ai-provider/model-runtime/model-providers/lm_studio/lm_studio.yaml
@@ -96,4 +96,14 @@ model_credential_schema:
label:
en_US: 'No'
zh_Hans: 否
+provider_credential_schema:
+ credential_form_schemas:
+ - variable: base_url
+ label:
+ en_US: https://lmstudio.ai
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
address: https://lmstudio.ai
diff --git a/ai-provider/model-runtime/model-providers/minimax/minimax.yaml b/ai-provider/model-runtime/model-providers/minimax/minimax.yaml
index d6d82e8a..981f2af5 100644
--- a/ai-provider/model-runtime/model-providers/minimax/minimax.yaml
+++ b/ai-provider/model-runtime/model-providers/minimax/minimax.yaml
@@ -27,6 +27,14 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.minimax.chat
+ - variable: base_url
+ label:
+ en_US: https://api.minimax.chat/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.minimax.chat/v1
recommend: true
sort: 5
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/mistralai/mistralai.yaml b/ai-provider/model-runtime/model-providers/mistralai/mistralai.yaml
index e00a4821..a9982657 100644
--- a/ai-provider/model-runtime/model-providers/mistralai/mistralai.yaml
+++ b/ai-provider/model-runtime/model-providers/mistralai/mistralai.yaml
@@ -29,4 +29,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://api.mistral.ai
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
address: https://api.mistral.ai
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/moonshot/moonshot.yaml b/ai-provider/model-runtime/model-providers/moonshot/moonshot.yaml
index 406213b3..58786544 100644
--- a/ai-provider/model-runtime/model-providers/moonshot/moonshot.yaml
+++ b/ai-provider/model-runtime/model-providers/moonshot/moonshot.yaml
@@ -31,6 +31,14 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.moonshot.cn
+ - variable: base_url
+ label:
+ en_US: https://api.moonshot.cn/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.moonshot.cn/v1
recommend: true
sort: 6
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/novita/novita.yaml b/ai-provider/model-runtime/model-providers/novita/novita.yaml
index 852c3422..fd126939 100644
--- a/ai-provider/model-runtime/model-providers/novita/novita.yaml
+++ b/ai-provider/model-runtime/model-providers/novita/novita.yaml
@@ -29,4 +29,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.novita.ai
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.novita.ai/v3/openai
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.novita.ai/v3/openai
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/nvidia/nvidia.yaml b/ai-provider/model-runtime/model-providers/nvidia/nvidia.yaml
index c2038512..821c4f94 100644
--- a/ai-provider/model-runtime/model-providers/nvidia/nvidia.yaml
+++ b/ai-provider/model-runtime/model-providers/nvidia/nvidia.yaml
@@ -31,4 +31,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://integrate.api.nvidia.com
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
address: https://integrate.api.nvidia.com
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/ollama/assets/icon_l_en.svg b/ai-provider/model-runtime/model-providers/ollama/assets/icon_l_en.svg
index 5f08476c..492903f4 100644
--- a/ai-provider/model-runtime/model-providers/ollama/assets/icon_l_en.svg
+++ b/ai-provider/model-runtime/model-providers/ollama/assets/icon_l_en.svg
@@ -1 +1,9 @@
-
\ No newline at end of file
+
diff --git a/ai-provider/model-runtime/model-providers/ollama/assets/icon_s_en.svg b/ai-provider/model-runtime/model-providers/ollama/assets/icon_s_en.svg
index 5f08476c..492903f4 100644
--- a/ai-provider/model-runtime/model-providers/ollama/assets/icon_s_en.svg
+++ b/ai-provider/model-runtime/model-providers/ollama/assets/icon_s_en.svg
@@ -1 +1,9 @@
-
\ No newline at end of file
+
diff --git a/ai-provider/model-runtime/model-providers/ollama/ollama.yaml b/ai-provider/model-runtime/model-providers/ollama/ollama.yaml
index b9144630..d662a3fd 100644
--- a/ai-provider/model-runtime/model-providers/ollama/ollama.yaml
+++ b/ai-provider/model-runtime/model-providers/ollama/ollama.yaml
@@ -17,6 +17,17 @@ supported_model_types:
- text-embedding
configurate_methods:
- customizable-model
+provider_credential_schema:
+ credential_form_schemas:
+ - variable: base_url
+ label:
+ zh_Hans: API Base
+ en_US: API Base
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 API Base, 如:http://127.0.0.1:11434
+ en_US: Enter your API Base, e.g. http://127.0.0.1:11434
model_credential_schema:
model:
label:
diff --git a/ai-provider/model-runtime/model-providers/openAI/openai.yaml b/ai-provider/model-runtime/model-providers/openAI/openai.yaml
index 2d5cfca6..75e1bbe9 100644
--- a/ai-provider/model-runtime/model-providers/openAI/openai.yaml
+++ b/ai-provider/model-runtime/model-providers/openAI/openai.yaml
@@ -78,6 +78,6 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Base, 如:https://api.openai.com
en_US: Enter your API Base, e.g. https://api.openai.com
-address: https://api.openai.com
+address: https://api.openai.com/v1
recommend: true
sort: 1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/openrouter/openrouter.yaml b/ai-provider/model-runtime/model-providers/openrouter/openrouter.yaml
index ad95d283..a1eedbac 100644
--- a/ai-provider/model-runtime/model-providers/openrouter/openrouter.yaml
+++ b/ai-provider/model-runtime/model-providers/openrouter/openrouter.yaml
@@ -103,4 +103,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://openrouter.ai
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://openrouter.ai/api/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://openrouter.ai/api/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/perfxcloud/perfxcloud.yaml b/ai-provider/model-runtime/model-providers/perfxcloud/perfxcloud.yaml
index bd63e495..4cc7a112 100644
--- a/ai-provider/model-runtime/model-providers/perfxcloud/perfxcloud.yaml
+++ b/ai-provider/model-runtime/model-providers/perfxcloud/perfxcloud.yaml
@@ -31,4 +31,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://cloud.perfxlab.cn
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://perfxcloud.io/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://perfxcloud.io/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/siliconflow/siliconflow.yaml b/ai-provider/model-runtime/model-providers/siliconflow/siliconflow.yaml
index f9c932f4..ab5cb9b4 100644
--- a/ai-provider/model-runtime/model-providers/siliconflow/siliconflow.yaml
+++ b/ai-provider/model-runtime/model-providers/siliconflow/siliconflow.yaml
@@ -30,4 +30,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.openai.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://perfxcloud.io/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.siliconflow.cn/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/spark/spark.yaml b/ai-provider/model-runtime/model-providers/spark/spark.yaml
index cbfedef4..cc8fcc8f 100644
--- a/ai-provider/model-runtime/model-providers/spark/spark.yaml
+++ b/ai-provider/model-runtime/model-providers/spark/spark.yaml
@@ -20,13 +20,20 @@ configurate_methods:
- predefined-model
provider_credential_schema:
credential_form_schemas:
- - variable: api_password
+ - variable: api_key
label:
- en_US: APIPassword
+ en_US: API Key
type: secret-input
required: true
placeholder:
- zh_Hans: 在此输入您的 APIPassword
- en_US: Enter your APIPassword
-
-address: https://spark-api-open.xf-yun.com
\ No newline at end of file
+ zh_Hans: 在此输入您的 API Key
+ en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://spark-api-open.xf-yun.com/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://spark-api-open.xf-yun.com/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/stepfun/stepfun.yaml b/ai-provider/model-runtime/model-providers/stepfun/stepfun.yaml
index 5466ec4e..83434305 100644
--- a/ai-provider/model-runtime/model-providers/stepfun/stepfun.yaml
+++ b/ai-provider/model-runtime/model-providers/stepfun/stepfun.yaml
@@ -31,6 +31,14 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: https://api.stepfun.com/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
model_credential_schema:
model:
label:
@@ -79,4 +87,4 @@ model_credential_schema:
label:
en_US: Tool Call
zh_Hans: Tool Call
-address: https://api.stepfun.com
\ No newline at end of file
+address: https://api.stepfun.com/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/tongyi/tongyi.yaml b/ai-provider/model-runtime/model-providers/tongyi/tongyi.yaml
index da535348..78c070e2 100644
--- a/ai-provider/model-runtime/model-providers/tongyi/tongyi.yaml
+++ b/ai-provider/model-runtime/model-providers/tongyi/tongyi.yaml
@@ -29,4 +29,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://dashscope.aliyuncs.com
\ No newline at end of file
+ - variable: dashscope_api_base
+ label:
+ en_US: https://dashscope.aliyuncs.com/compatible-mode/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://dashscope.aliyuncs.com/compatible-mode/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/upstage/upstage.yaml b/ai-provider/model-runtime/model-providers/upstage/upstage.yaml
index b52bd1bb..ec44fc82 100644
--- a/ai-provider/model-runtime/model-providers/upstage/upstage.yaml
+++ b/ai-provider/model-runtime/model-providers/upstage/upstage.yaml
@@ -47,4 +47,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.upstage.ai
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.upstage.ai/v1/solar
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.upstage.ai/v1/solar
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-haiku.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-haiku.yaml
index 56133486..fb6f6d71 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-haiku.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-haiku.yaml
@@ -1,4 +1,4 @@
-model: claude-3-haiku@20240307
+model: google/claude-3-haiku@20240307
label:
en_US: Claude 3 Haiku
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-opus.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-opus.yaml
index ab084636..767199de 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-opus.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-opus.yaml
@@ -1,4 +1,4 @@
-model: claude-3-opus@20240229
+model: google/claude-3-opus@20240229
label:
en_US: Claude 3 Opus
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-sonnet.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-sonnet.yaml
index 0be0113f..a5f99d54 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-sonnet.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3-sonnet.yaml
@@ -1,4 +1,4 @@
-model: claude-3-sonnet@20240229
+model: google/claude-3-sonnet@20240229
label:
en_US: Claude 3 Sonnet
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet-v2.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet-v2.yaml
index 37b9f30c..48a1a866 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet-v2.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet-v2.yaml
@@ -1,4 +1,4 @@
-model: claude-3-5-sonnet-v2@20241022
+model: google/claude-3-5-sonnet-v2@20241022
label:
en_US: Claude 3.5 Sonnet v2
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet.yaml
index c64384e6..0f17f26d 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/anthropic.claude-3.5-sonnet.yaml
@@ -1,4 +1,4 @@
-model: claude-3-5-sonnet@20240620
+model: google/claude-3-5-sonnet@20240620
label:
en_US: Claude 3.5 Sonnet
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro-vision.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro-vision.yaml
index 4630f063..161903c3 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro-vision.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro-vision.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.0-pro-vision-001
+model: google/gemini-1.0-pro-vision-001
label:
en_US: Gemini 1.0 Pro Vision
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro.yaml
index 7a50d8c1..6fb6398e 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.0-pro.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.0-pro-002
+model: google/gemini-1.0-pro-002
label:
en_US: Gemini 1.0 Pro
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-001.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-001.yaml
index 1d9a0b0c..7862d4c0 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-001.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-001.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.5-flash-001
+model: google/gemini-1.5-flash-001
label:
en_US: Gemini 1.5 Flash 001
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-002.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-002.yaml
index 066d4ba3..85306da5 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-002.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-flash-002.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.5-flash-002
+model: google/gemini-1.5-flash-002
label:
en_US: Gemini 1.5 Flash 002
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-001.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-001.yaml
index 33d2c25a..2aeb4ea8 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-001.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-001.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.5-pro-001
+model: google/gemini-1.5-pro-001
label:
en_US: Gemini 1.5 Pro 001
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-002.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-002.yaml
index 8b4c33cc..fb7acb5c 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-002.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-1.5-pro-002.yaml
@@ -1,4 +1,4 @@
-model: gemini-1.5-pro-002
+model: google/gemini-1.5-pro-002
label:
en_US: Gemini 1.5 Pro 002
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-001.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-001.yaml
index bef7ca5e..89bcc8e4 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-001.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-001.yaml
@@ -1,4 +1,4 @@
-model: gemini-2.0-flash-001
+model: google/gemini-2.0-flash-001
label:
en_US: Gemini 2.0 Flash 001
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-exp.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-exp.yaml
index bcd59623..e8c7382b 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-exp.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-exp.yaml
@@ -1,4 +1,4 @@
-model: gemini-2.0-flash-exp
+model: google/gemini-2.0-flash-exp
label:
en_US: Gemini 2.0 Flash Exp
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-lite-preview-02-05.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-lite-preview-02-05.yaml
index 9c0a1e06..65e75f07 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-lite-preview-02-05.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-lite-preview-02-05.yaml
@@ -1,4 +1,4 @@
-model: gemini-2.0-flash-lite-preview-02-05
+model: google/gemini-2.0-flash-lite-preview-02-05
label:
en_US: Gemini 2.0 Flash Lite Preview 0205
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-thinking-exp-01-21.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-thinking-exp-01-21.yaml
index 6e2fc767..4e384651 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-thinking-exp-01-21.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-flash-thinking-exp-01-21.yaml
@@ -1,4 +1,4 @@
-model: gemini-2.0-flash-thinking-exp-01-21
+model: google/gemini-2.0-flash-thinking-exp-01-21
label:
en_US: Gemini 2.0 Flash Thinking Exp 0121
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-pro-exp-02-05.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-pro-exp-02-05.yaml
index 96926a17..7166ec7b 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-pro-exp-02-05.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-2.0-pro-exp-02-05.yaml
@@ -1,4 +1,4 @@
-model: gemini-2.0-pro-exp-02-05
+model: google/gemini-2.0-pro-exp-02-05
label:
en_US: Gemini 2.0 Pro Exp 0205
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1114.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1114.yaml
index bd49b476..e79bc321 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1114.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1114.yaml
@@ -1,4 +1,4 @@
-model: gemini-exp-1114
+model: google/gemini-exp-1114
label:
en_US: Gemini exp 1114
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1121.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1121.yaml
index 8e3f218d..4c1d7de7 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1121.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1121.yaml
@@ -1,4 +1,4 @@
-model: gemini-exp-1121
+model: google/gemini-exp-1121
label:
en_US: Gemini exp 1121
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1206.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1206.yaml
index 7a7c361c..268c34e9 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1206.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-exp-1206.yaml
@@ -1,4 +1,4 @@
-model: gemini-exp-1206
+model: google/gemini-exp-1206
label:
en_US: Gemini exp 1206
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-flash-experimental.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-flash-experimental.yaml
index ef340372..c6573493 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-flash-experimental.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-flash-experimental.yaml
@@ -1,4 +1,4 @@
-model: gemini-flash-experimental
+model: google/gemini-flash-experimental
label:
en_US: Gemini Flash Experimental
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-pro-experimental.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-pro-experimental.yaml
index cff10423..67667fb5 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-pro-experimental.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/llm/gemini-pro-experimental.yaml
@@ -1,4 +1,4 @@
-model: gemini-pro-experimental
+model: google/gemini-pro-experimental
label:
en_US: Gemini Pro Experimental
model_type: llm
diff --git a/ai-provider/model-runtime/model-providers/vertex_ai/vertex_ai.yaml b/ai-provider/model-runtime/model-providers/vertex_ai/vertex_ai.yaml
index 43945e5f..1016af99 100644
--- a/ai-provider/model-runtime/model-providers/vertex_ai/vertex_ai.yaml
+++ b/ai-provider/model-runtime/model-providers/vertex_ai/vertex_ai.yaml
@@ -20,6 +20,15 @@ configurate_methods:
- predefined-model
provider_credential_schema:
credential_form_schemas:
+ - variable: vertex_api_base
+ label:
+ zh_Hans: API Base
+ en_US: API Base
+ type: text-input
+ required: true
+ placeholder:
+ zh_Hans: 在此输入您的 API Base
+ en_US: Enter your API Base
- variable: vertex_project_id
label:
en_US: Project ID
@@ -36,9 +45,12 @@ provider_credential_schema:
en_US: Enter your Google Cloud Location
- variable: vertex_service_account_key
label:
- en_US: Service Account Key (Leave blank if you use Application Default Credentials)
+ en_US: Enter your Google Cloud Service Account Key in base64 format
type: secret-input
- required: false
+ required: true
placeholder:
en_US: Enter your Google Cloud Service Account Key in base64 format
-address: https://api.openai.com
\ No newline at end of file
+address: https://api.openai.com
+model_config:
+ access_configuration_status: true
+ access_configuration_demo: "{\"vertex_location\": \"\", \"vertex_project_id\": \"\", \"vertex_model\":\"\"}"
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/volcengine_maas/volcengine_maas.yaml b/ai-provider/model-runtime/model-providers/volcengine_maas/volcengine_maas.yaml
index 1a970c63..487f0c8d 100644
--- a/ai-provider/model-runtime/model-providers/volcengine_maas/volcengine_maas.yaml
+++ b/ai-provider/model-runtime/model-providers/volcengine_maas/volcengine_maas.yaml
@@ -1,342 +1,357 @@
-provider: volcengine_maas
-label:
- en_US: Volcengine
-description:
- en_US: Volcengine Ark models.
- zh_Hans: 火山方舟提供的模型,例如 Doubao-pro-4k、Doubao-pro-32k 和 Doubao-pro-128k。
-icon_small:
- en_US: icon_s_en.svg
-icon_large:
- en_US: icon_l_en.svg
- zh_Hans: icon_l_zh.svg
-background: "#F9FAFB"
-help:
- title:
- en_US: Get your Access Key and Secret Access Key from Volcengine Console
- zh_Hans: 从火山引擎控制台获取您的 Access Key 和 Secret Access Key
- url:
- en_US: https://console.volcengine.com/iam/keymanage/
-supported_model_types:
- - llm
- - text-embedding
-configurate_methods:
- - customizable-model
-model_credential_schema:
- model:
- label:
- en_US: Model Name
- zh_Hans: 模型名称
- placeholder:
- en_US: Enter your Model Name
- zh_Hans: 输入模型名称
- credential_form_schemas:
- - variable: auth_method
- required: true
- label:
- en_US: Authentication Method
- zh_Hans: 鉴权方式
- type: select
- default: aksk
- options:
- - label:
- en_US: API Key
- value: api_key
- - label:
- en_US: Access Key / Secret Access Key
- value: aksk
- placeholder:
- en_US: Enter your Authentication Method
- zh_Hans: 选择鉴权方式
- - variable: volc_access_key_id
- required: true
- show_on:
- - variable: auth_method
- value: aksk
- label:
- en_US: Access Key
- zh_Hans: Access Key
- type: secret-input
- placeholder:
- en_US: Enter your Access Key
- zh_Hans: 输入您的 Access Key
- - variable: volc_secret_access_key
- required: true
- show_on:
- - variable: auth_method
- value: aksk
- label:
- en_US: Secret Access Key
- zh_Hans: Secret Access Key
- type: secret-input
- placeholder:
- en_US: Enter your Secret Access Key
- zh_Hans: 输入您的 Secret Access Key
- - variable: volc_api_key
- required: true
- show_on:
- - variable: auth_method
- value: api_key
- label:
- en_US: API Key
- type: secret-input
- placeholder:
- en_US: Enter your API Key
- zh_Hans: 输入您的 API Key
- - variable: volc_region
- required: true
- label:
- en_US: Volcengine Region
- zh_Hans: 火山引擎地域
- type: text-input
- default: cn-beijing
- placeholder:
- en_US: Enter Volcengine Region
- zh_Hans: 输入火山引擎地域
- - variable: api_endpoint_host
- required: true
- label:
- en_US: API Endpoint Host
- zh_Hans: API Endpoint Host
- type: text-input
- default: https://ark.cn-beijing.volces.com/api/v3
- placeholder:
- en_US: Enter your API Endpoint Host
- zh_Hans: 输入 API Endpoint Host
- - variable: endpoint_id
- required: true
- label:
- en_US: Endpoint ID
- zh_Hans: Endpoint ID
- type: text-input
- placeholder:
- en_US: Enter your Endpoint ID
- zh_Hans: 输入您的 Endpoint ID
- - variable: base_model_name
- label:
- en_US: Base Model
- zh_Hans: 基础模型
- type: select
- required: true
- options:
- - label:
- en_US: DeepSeek-R1-Distill-Qwen-32B
- value: DeepSeek-R1-Distill-Qwen-32B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: DeepSeek-R1-Distill-Qwen-7B
- value: DeepSeek-R1-Distill-Qwen-7B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: DeepSeek-R1
- value: DeepSeek-R1
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: DeepSeek-V3
- value: DeepSeek-V3
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-1.5-vision-pro-32k
- value: Doubao-1.5-vision-pro-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-1.5-pro-32k
- value: Doubao-1.5-pro-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-1.5-lite-32k
- value: Doubao-1.5-lite-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-1.5-pro-256k
- value: Doubao-1.5-pro-256k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-vision-pro-32k
- value: Doubao-vision-pro-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-vision-lite-32k
- value: Doubao-vision-lite-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-pro-4k
- value: Doubao-pro-4k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-lite-4k
- value: Doubao-lite-4k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-pro-32k
- value: Doubao-pro-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-lite-32k
- value: Doubao-lite-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-pro-128k
- value: Doubao-pro-128k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-lite-128k
- value: Doubao-lite-128k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-pro-256k
- value: Doubao-pro-256k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Llama3-8B
- value: Llama3-8B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Llama3-70B
- value: Llama3-70B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Moonshot-v1-8k
- value: Moonshot-v1-8k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Moonshot-v1-32k
- value: Moonshot-v1-32k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Moonshot-v1-128k
- value: Moonshot-v1-128k
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: GLM3-130B
- value: GLM3-130B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: GLM3-130B-Fin
- value: GLM3-130B-Fin
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Mistral-7B
- value: Mistral-7B
- show_on:
- - variable: __model_type
- value: llm
- - label:
- en_US: Doubao-embedding
- value: Doubao-embedding
- show_on:
- - variable: __model_type
- value: text-embedding
- - label:
- en_US: Doubao-embedding-large
- value: Doubao-embedding-large
- show_on:
- - variable: __model_type
- value: text-embedding
- - label:
- en_US: Custom
- zh_Hans: 自定义
- value: Custom
- - variable: mode
- required: true
- show_on:
- - variable: __model_type
- value: llm
- - variable: base_model_name
- value: Custom
- label:
- zh_Hans: 模型类型
- en_US: Completion Mode
- type: select
- default: chat
- placeholder:
- zh_Hans: 选择对话类型
- en_US: Select Completion Mode
- options:
- - value: completion
- label:
- en_US: Completion
- zh_Hans: 补全
- - value: chat
- label:
- en_US: Chat
- zh_Hans: 对话
- - variable: context_size
- required: true
- show_on:
- - variable: base_model_name
- value: Custom
- label:
- zh_Hans: 模型上下文长度
- en_US: Model Context Size
- type: text-input
- default: "4096"
- placeholder:
- zh_Hans: 输入您的模型上下文长度
- en_US: Enter your Model Context Size
- - variable: max_tokens
- required: true
- show_on:
- - variable: __model_type
- value: llm
- - variable: base_model_name
- value: Custom
- label:
- zh_Hans: 最大 token 上限
- en_US: Upper Bound for Max Tokens
- default: "4096"
- type: text-input
- placeholder:
- zh_Hans: 输入您的模型最大 token 上限
- en_US: Enter your model Upper Bound for Max Tokens
-address: https://open.volcengine.com
-model_config:
- access_configuration_status: true
- access_configuration_demo: "{\"endpoint\": \"https://196.1.1.2:3824\"}"
\ No newline at end of file
+provider: volcengine_maas
+label:
+ en_US: Volcengine
+description:
+ en_US: Volcengine Ark models.
+ zh_Hans: 火山方舟提供的模型,例如 Doubao-pro-4k、Doubao-pro-32k 和 Doubao-pro-128k。
+icon_small:
+ en_US: icon_s_en.svg
+icon_large:
+ en_US: icon_l_en.svg
+ zh_Hans: icon_l_zh.svg
+background: "#F9FAFB"
+help:
+ title:
+ en_US: Get your Access Key and Secret Access Key from Volcengine Console
+ zh_Hans: 从火山引擎控制台获取您的 Access Key 和 Secret Access Key
+ url:
+ en_US: https://console.volcengine.com/iam/keymanage/
+supported_model_types:
+ - llm
+ - text-embedding
+configurate_methods:
+ - customizable-model
+
+model_credential_schema:
+ model:
+ label:
+ en_US: Model Name
+ zh_Hans: 模型名称
+ placeholder:
+ en_US: Enter your Model Name
+ zh_Hans: 输入模型名称
+ credential_form_schemas:
+ - variable: auth_method
+ required: true
+ label:
+ en_US: Authentication Method
+ zh_Hans: 鉴权方式
+ type: select
+ default: aksk
+ options:
+ - label:
+ en_US: API Key
+ value: api_key
+ - label:
+ en_US: Access Key / Secret Access Key
+ value: aksk
+ placeholder:
+ en_US: Enter your Authentication Method
+ zh_Hans: 选择鉴权方式
+ - variable: volc_access_key_id
+ required: true
+ show_on:
+ - variable: auth_method
+ value: aksk
+ label:
+ en_US: Access Key
+ zh_Hans: Access Key
+ type: secret-input
+ placeholder:
+ en_US: Enter your Access Key
+ zh_Hans: 输入您的 Access Key
+ - variable: volc_secret_access_key
+ required: true
+ show_on:
+ - variable: auth_method
+ value: aksk
+ label:
+ en_US: Secret Access Key
+ zh_Hans: Secret Access Key
+ type: secret-input
+ placeholder:
+ en_US: Enter your Secret Access Key
+ zh_Hans: 输入您的 Secret Access Key
+ - variable: volc_api_key
+ required: true
+ show_on:
+ - variable: auth_method
+ value: api_key
+ label:
+ en_US: API Key
+ type: secret-input
+ placeholder:
+ en_US: Enter your API Key
+ zh_Hans: 输入您的 API Key
+ - variable: volc_region
+ required: true
+ label:
+ en_US: Volcengine Region
+ zh_Hans: 火山引擎地域
+ type: text-input
+ default: cn-beijing
+ placeholder:
+ en_US: Enter Volcengine Region
+ zh_Hans: 输入火山引擎地域
+ - variable: api_endpoint_host
+ required: true
+ label:
+ en_US: API Endpoint Host
+ zh_Hans: API Endpoint Host
+ type: text-input
+ default: https://ark.cn-beijing.volces.com/api/v3
+ placeholder:
+ en_US: Enter your API Endpoint Host
+ zh_Hans: 输入 API Endpoint Host
+ - variable: endpoint_id
+ required: true
+ label:
+ en_US: Endpoint ID
+ zh_Hans: Endpoint ID
+ type: text-input
+ placeholder:
+ en_US: Enter your Endpoint ID
+ zh_Hans: 输入您的 Endpoint ID
+ - variable: base_model_name
+ label:
+ en_US: Base Model
+ zh_Hans: 基础模型
+ type: select
+ required: true
+ options:
+ - label:
+ en_US: DeepSeek-R1-Distill-Qwen-32B
+ value: DeepSeek-R1-Distill-Qwen-32B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: DeepSeek-R1-Distill-Qwen-7B
+ value: DeepSeek-R1-Distill-Qwen-7B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: DeepSeek-R1
+ value: DeepSeek-R1
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: DeepSeek-V3
+ value: DeepSeek-V3
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-1.5-vision-pro-32k
+ value: Doubao-1.5-vision-pro-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-1.5-pro-32k
+ value: Doubao-1.5-pro-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-1.5-lite-32k
+ value: Doubao-1.5-lite-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-1.5-pro-256k
+ value: Doubao-1.5-pro-256k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-vision-pro-32k
+ value: Doubao-vision-pro-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-vision-lite-32k
+ value: Doubao-vision-lite-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-pro-4k
+ value: Doubao-pro-4k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-lite-4k
+ value: Doubao-lite-4k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-pro-32k
+ value: Doubao-pro-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-lite-32k
+ value: Doubao-lite-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-pro-128k
+ value: Doubao-pro-128k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-lite-128k
+ value: Doubao-lite-128k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-pro-256k
+ value: Doubao-pro-256k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Llama3-8B
+ value: Llama3-8B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Llama3-70B
+ value: Llama3-70B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Moonshot-v1-8k
+ value: Moonshot-v1-8k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Moonshot-v1-32k
+ value: Moonshot-v1-32k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Moonshot-v1-128k
+ value: Moonshot-v1-128k
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: GLM3-130B
+ value: GLM3-130B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: GLM3-130B-Fin
+ value: GLM3-130B-Fin
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Mistral-7B
+ value: Mistral-7B
+ show_on:
+ - variable: __model_type
+ value: llm
+ - label:
+ en_US: Doubao-embedding
+ value: Doubao-embedding
+ show_on:
+ - variable: __model_type
+ value: text-embedding
+ - label:
+ en_US: Doubao-embedding-large
+ value: Doubao-embedding-large
+ show_on:
+ - variable: __model_type
+ value: text-embedding
+ - label:
+ en_US: Custom
+ zh_Hans: 自定义
+ value: Custom
+ - variable: mode
+ required: true
+ show_on:
+ - variable: __model_type
+ value: llm
+ - variable: base_model_name
+ value: Custom
+ label:
+ zh_Hans: 模型类型
+ en_US: Completion Mode
+ type: select
+ default: chat
+ placeholder:
+ zh_Hans: 选择对话类型
+ en_US: Select Completion Mode
+ options:
+ - value: completion
+ label:
+ en_US: Completion
+ zh_Hans: 补全
+ - value: chat
+ label:
+ en_US: Chat
+ zh_Hans: 对话
+ - variable: context_size
+ required: true
+ show_on:
+ - variable: base_model_name
+ value: Custom
+ label:
+ zh_Hans: 模型上下文长度
+ en_US: Model Context Size
+ type: text-input
+ default: "4096"
+ placeholder:
+ zh_Hans: 输入您的模型上下文长度
+ en_US: Enter your Model Context Size
+ - variable: max_tokens
+ required: true
+ show_on:
+ - variable: __model_type
+ value: llm
+ - variable: base_model_name
+ value: Custom
+ label:
+ zh_Hans: 最大 token 上限
+ en_US: Upper Bound for Max Tokens
+ default: "4096"
+ type: text-input
+ placeholder:
+ zh_Hans: 输入您的模型最大 token 上限
+ en_US: Enter your model Upper Bound for Max Tokens
+provider_credential_schema:
+ credential_form_schemas:
+ - variable: api_key
+ label:
+ en_US: APIKey
+ type: secret-input
+ required: true
+ placeholder:
+ zh_Hans: 在此输入您的 APIKey
+ en_US: Enter your APIKey
+ - variable: base_url
+ label:
+ en_US: https://ark.cn-beijing.volces.com/api/v3
+ required: true
+ placeholder:
+ zh_Hans: 在此输入您的 Base url
+ en_US: Enter your Base url
+address: https://ark.cn-beijing.volces.com/api/v3
diff --git a/ai-provider/model-runtime/model-providers/wenxin/wenxin.yaml b/ai-provider/model-runtime/model-providers/wenxin/wenxin.yaml
index e429ea11..603ed9a5 100644
--- a/ai-provider/model-runtime/model-providers/wenxin/wenxin.yaml
+++ b/ai-provider/model-runtime/model-providers/wenxin/wenxin.yaml
@@ -30,14 +30,14 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
- - variable: secret_key
+ - variable: base_url
label:
- en_US: Secret Key
- type: secret-input
- required: true
+ en_US: https://qianfan.baidubce.com/v2
+ type: text-input
+ required: false
placeholder:
- zh_Hans: 在此输入您的 Secret Key
- en_US: Enter your Secret Key
-address: https://aip.baidubce.com
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://qianfan.baidubce.com/v2
recommend: true
sort: 7
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/xinference/xinference.yaml b/ai-provider/model-runtime/model-providers/xinference/xinference.yaml
index 6d284644..21192037 100644
--- a/ai-provider/model-runtime/model-providers/xinference/xinference.yaml
+++ b/ai-provider/model-runtime/model-providers/xinference/xinference.yaml
@@ -76,4 +76,14 @@ model_credential_schema:
placeholder:
zh_Hans: 在此输入调用重试次数
en_US: Enter max retries
+provider_credential_schema:
+ credential_form_schemas:
+ - variable: base_url
+ label:
+ en_US: Base URL
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
address: https://xinference.ai
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/yi/yi.yaml b/ai-provider/model-runtime/model-providers/yi/yi.yaml
index 919cba1b..5d9156f6 100644
--- a/ai-provider/model-runtime/model-providers/yi/yi.yaml
+++ b/ai-provider/model-runtime/model-providers/yi/yi.yaml
@@ -30,4 +30,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
-address: https://api.lingyiwanwu.com
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://api.lingyiwanwu.com/v1
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
+address: https://api.lingyiwanwu.com/v1
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/zhinao/zhinao.yaml b/ai-provider/model-runtime/model-providers/zhinao/zhinao.yaml
index 7d2c5372..ff62cd36 100644
--- a/ai-provider/model-runtime/model-providers/zhinao/zhinao.yaml
+++ b/ai-provider/model-runtime/model-providers/zhinao/zhinao.yaml
@@ -30,4 +30,12 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 API Key
en_US: Enter your API Key
+ - variable: base_url
+ label:
+ en_US: Base URL
+ type: text-input
+ required: false
+ placeholder:
+ zh_Hans: 在此输入您的 Base URL
+ en_US: Enter your Base URL
address: https://api.360.cn
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model-providers/zhipuai/zhipuai.yaml b/ai-provider/model-runtime/model-providers/zhipuai/zhipuai.yaml
index 3a33ee45..c318c8b8 100644
--- a/ai-provider/model-runtime/model-providers/zhipuai/zhipuai.yaml
+++ b/ai-provider/model-runtime/model-providers/zhipuai/zhipuai.yaml
@@ -29,4 +29,11 @@ provider_credential_schema:
placeholder:
zh_Hans: 在此输入您的 APIKey
en_US: Enter your APIKey
-address: https://open.bigmodel.cn
\ No newline at end of file
+ - variable: base_url
+ label:
+ en_US: https://open.bigmodel.cn/api/paas/v4/
+ required: true
+ placeholder:
+ zh_Hans: 在此输入您的 Base url
+ en_US: Enter your Base url
+address: https://open.bigmodel.cn/api/paas/v4/
\ No newline at end of file
diff --git a/ai-provider/model-runtime/model.go b/ai-provider/model-runtime/model.go
index 44d29e2f..2768f2a7 100644
--- a/ai-provider/model-runtime/model.go
+++ b/ai-provider/model-runtime/model.go
@@ -97,6 +97,10 @@ func NewModel(data string, logo string) (IModel, error) {
params := make(ParamValidator, 0, len(cfg.ParameterRules))
defaultConfig := make(map[string]interface{})
for _, p := range cfg.ParameterRules {
+ if (p.Default == nil || p.Default == "" || p.Default == 0 || p.Default == false) && !p.Required {
+ defaultConfig[p.Name] = nil
+ continue
+ }
t := p.Type
if t == "" {
t = ParameterTypeStr
diff --git a/ai-provider/model-runtime/provider.go b/ai-provider/model-runtime/provider.go
index 435f44fd..5183810f 100644
--- a/ai-provider/model-runtime/provider.go
+++ b/ai-provider/model-runtime/provider.go
@@ -50,7 +50,7 @@ type IProviderInfo interface {
}
func GetCustomizeLogo() string {
- logo, _ := providerDir.ReadFile("customize/assets/icon_s_en.svg")
+ logo, _ := providerDir.ReadFile("model-providers/customize/assets/icon_s_en.svg")
return string(logo)
}
diff --git a/app/ai-event-handler/nsq.go b/app/ai-event-handler/nsq.go
index 3f891490..be133e6e 100644
--- a/app/ai-event-handler/nsq.go
+++ b/app/ai-event-handler/nsq.go
@@ -81,7 +81,7 @@ func convertInt(value interface{}) int {
func genAIKey(key string, provider string) string {
keys := strings.Split(key, "@")
- return strings.TrimSuffix(keys[0], fmt.Sprintf("-%s", provider))
+ return strings.TrimPrefix(keys[0], fmt.Sprintf("%s-", provider))
}
// HandleMessage 处理从 NSQ 读取的消息
diff --git a/common/regexp.go b/common/regexp.go
index 3e78ec44..2c1486ed 100644
--- a/common/regexp.go
+++ b/common/regexp.go
@@ -25,6 +25,8 @@ const (
CIDRIpv4Exp = `^(?:(?:[0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])\.){3}(?:[0-9]|[1-9][0-9]|1[0-9]{2}|2[0-4][0-9]|25[0-5])(\/([1-9]|[1-2]\d|3[0-2]))?$`
// CheckPathIPPortExp (scheme://)?ip:port
CheckPathIPPortExp = `([a-zA-z]+://)?((2(5[0-5]|[0-4]\d))|[0-1]?\d{1,2})(\.((2(5[0-5]|[0-4]\d))|[0-1]?\d{1,2})){3}:[0-9]+`
+ // EnglishOrNumberOrSpecialChars a-zA-Z0-9-_.:
+ EnglishOrNumberOrSpecialChars = `^(?i)[-/:._a-z0-9]+$`
)
var (
@@ -47,6 +49,8 @@ var (
restfulPathMatchRegexp = regexp.MustCompile(`({[0-9a-zA-Z-_]+})+`)
//restfulParamMatchRegexp 匹配restful参数 {xxx}
restfulParamMatchRegexp = regexp.MustCompile(`^{[0-9a-zA-Z-_]+}$`)
+ // modelNameRegexp match model name
+ modelNameRegexp = regexp.MustCompile(EnglishOrNumberOrSpecialChars)
)
func IsMatchString(regexpPattern RegexpPattern, s string) error {
@@ -129,3 +133,8 @@ func ReplaceRestfulPath(path, replaceStr string) string {
func CheckPathContainsIPPort(path string) bool {
return checkIPPortRegexp.MatchString(path)
}
+
+// ModelNameValid check model name is valid
+func ModelNameValid(param string) bool {
+ return modelNameRegexp.MatchString(param)
+}
diff --git a/controller/ai-api/iml.go b/controller/ai-api/iml.go
index 05e9baca..83292cbe 100644
--- a/controller/ai-api/iml.go
+++ b/controller/ai-api/iml.go
@@ -4,6 +4,8 @@ import (
"context"
"net/http"
+ ai_provider_local "github.com/APIParkLab/APIPark/ai-provider/local"
+
"github.com/APIParkLab/APIPark/model/plugin_model"
ai_api "github.com/APIParkLab/APIPark/module/ai-api"
ai_api_dto "github.com/APIParkLab/APIPark/module/ai-api/dto"
@@ -48,13 +50,13 @@ func (i *imlAPIController) Create(ctx *gin.Context, serviceId string, input *ai_
}
}
if input.AiModel != nil {
- provider := "ollama"
+ provider := ai_provider_local.ProviderLocal
if input.AiModel.Type != "local" {
provider = input.AiModel.Provider
}
plugins["ai_formatter"] = api.PluginSetting{
Config: plugin_model.ConfigType{
- "model": input.AiModel.Id,
+ "model": input.AiModel.Name,
"provider": provider,
"config": input.AiModel.Config,
},
@@ -63,6 +65,7 @@ func (i *imlAPIController) Create(ctx *gin.Context, serviceId string, input *ai_
_, err = i.routerModule.Create(ctx, serviceId, &router_dto.Create{
Id: input.Id,
+ Name: input.Name,
Path: input.Path,
Methods: []string{
http.MethodPost,
@@ -106,13 +109,13 @@ func (i *imlAPIController) Edit(ctx *gin.Context, serviceId string, apiId string
}
//var upstream *string
if input.AiModel != nil {
- provider := "ollama"
+ provider := ai_provider_local.ProviderLocal
if input.AiModel.Type != "local" {
provider = input.AiModel.Provider
}
proxy.Plugins["ai_formatter"] = api.PluginSetting{
Config: plugin_model.ConfigType{
- "model": input.AiModel.Id,
+ "model": input.AiModel.Name,
"provider": provider,
"config": input.AiModel.Config,
},
@@ -130,6 +133,7 @@ func (i *imlAPIController) Edit(ctx *gin.Context, serviceId string, apiId string
}
_, err = i.routerModule.Edit(ctx, serviceId, apiId, &router_dto.Edit{
+ Name: input.Name,
Description: input.Description,
Proxy: proxy,
Path: input.Path,
diff --git a/controller/ai-local/iml.go b/controller/ai-local/iml.go
index e436609a..a34d4a9b 100644
--- a/controller/ai-local/iml.go
+++ b/controller/ai-local/iml.go
@@ -245,7 +245,7 @@ func (i *imlLocalModelController) initAILocalService(ctx context.Context, model
}
serviceId := uuid.NewString()
prefix := fmt.Sprintf("/%s", serviceId[:8])
- providerId := "ollama"
+ providerId := ai_provider_local.ProviderLocal
err = i.transaction.Transaction(ctx, func(ctx context.Context) error {
_, err = i.serviceModule.Create(ctx, teamID, &service_dto.CreateService{
Id: serviceId,
@@ -267,7 +267,7 @@ func (i *imlLocalModelController) initAILocalService(ctx context.Context, model
})
return func() error {
- path := fmt.Sprintf("/%s/chat", strings.Trim(prefix, "/"))
+ path := fmt.Sprintf("/%s/chat/completions", strings.Trim(prefix, "/"))
timeout := 300000
retry := 0
aiPrompt := &ai_api_dto.AiPrompt{
@@ -276,7 +276,7 @@ func (i *imlLocalModelController) initAILocalService(ctx context.Context, model
}
aiModel := &ai_api_dto.AiModel{
Id: model,
- Config: ai_provider_local.OllamaConfig,
+ Config: ai_provider_local.LocalConfig,
Provider: providerId,
Type: "local",
}
diff --git a/controller/ai-model/iml.go b/controller/ai-model/iml.go
index fcb48134..21f62e39 100644
--- a/controller/ai-model/iml.go
+++ b/controller/ai-model/iml.go
@@ -3,6 +3,7 @@ package ai_model
import (
"encoding/json"
"fmt"
+ "github.com/APIParkLab/APIPark/common"
ai_model "github.com/APIParkLab/APIPark/module/ai-model"
model_dto "github.com/APIParkLab/APIPark/module/ai-model/dto"
"github.com/gin-gonic/gin"
@@ -22,8 +23,8 @@ func (i *imlProviderModelController) GetModelParametersTemplate(ctx *gin.Context
}
func (i *imlProviderModelController) UpdateProviderModel(ctx *gin.Context, provider string, input *model_dto.EditModel) error {
- if strings.TrimSpace(input.Name) == "" {
- return fmt.Errorf("name is empty")
+ if !common.ModelNameValid(input.Name) {
+ return fmt.Errorf("model name is invalid(a-zA-Z0-9-_.:/)")
}
if strings.TrimSpace(input.Id) == "" {
return fmt.Errorf("id is empty")
@@ -54,8 +55,8 @@ func (i *imlProviderModelController) DeleteProviderModel(ctx *gin.Context, provi
}
func (i *imlProviderModelController) AddProviderModel(ctx *gin.Context, provider string, input *model_dto.Model) (*model_dto.SimpleModel, error) {
- if strings.TrimSpace(input.Name) == "" {
- return nil, fmt.Errorf("name is empty")
+ if !common.ModelNameValid(input.Name) {
+ return nil, fmt.Errorf("model name illegal(a-zA-Z0-9-_.:/)")
}
if strings.TrimSpace(provider) == "" {
return nil, fmt.Errorf("provider is empty")
diff --git a/controller/ai/iml.go b/controller/ai/iml.go
index ae37239b..9b1c4737 100644
--- a/controller/ai/iml.go
+++ b/controller/ai/iml.go
@@ -3,6 +3,7 @@ package ai
import (
"encoding/json"
"fmt"
+ "github.com/APIParkLab/APIPark/common"
"strconv"
"strings"
@@ -24,8 +25,8 @@ func (i *imlProviderController) Delete(ctx *gin.Context, id string) error {
}
func (i *imlProviderController) AddProvider(ctx *gin.Context, input *ai_dto.NewProvider) (*ai_dto.SimpleProvider, error) {
- if strings.TrimSpace(input.Name) == "" {
- return nil, fmt.Errorf("name is empty")
+ if !common.ModelNameValid(input.Name) {
+ return nil, fmt.Errorf("name illegal(a-zA-Z0-9-_.:/)")
}
return i.module.AddProvider(ctx, input)
}
diff --git a/controller/mcp/iml.go b/controller/mcp/iml.go
new file mode 100644
index 00000000..6e7c6a4b
--- /dev/null
+++ b/controller/mcp/iml.go
@@ -0,0 +1,141 @@
+package mcp
+
+import (
+ "fmt"
+ "net/http"
+ "strings"
+ "sync"
+
+ mcp_server "github.com/APIParkLab/APIPark/mcp-server"
+ "github.com/APIParkLab/APIPark/module/mcp"
+ "github.com/APIParkLab/APIPark/module/system"
+ "github.com/eolinker/go-common/utils"
+ "github.com/gin-gonic/gin"
+ mcp2 "github.com/mark3labs/mcp-go/mcp"
+ "github.com/mark3labs/mcp-go/server"
+)
+
+var _ IMcpController = (*imlMcpController)(nil)
+
+type imlMcpController struct {
+ settingModule system.ISettingModule `autowired:""`
+ mcpModule mcp.IMcpModule `autowired:""`
+ sessionKeys sync.Map
+ server http.Handler
+ openServer http.Handler
+}
+
+var mcpDefaultConfig = `{
+ "mcpServers": {
+ "%s": {
+ "url": "%s"
+ }
+ }
+}
+`
+
+func (i *imlMcpController) GlobalMCPConfig(ctx *gin.Context) (string, error) {
+ cfg := i.settingModule.Get(ctx)
+ if cfg.SitePrefix == "" {
+ return "", fmt.Errorf("site prefix is empty")
+ }
+ return fmt.Sprintf(mcpDefaultConfig, "APIPark-MCP-Server", fmt.Sprintf("%s/openapi/v1/%s/sse?apikey={your_api_key}", strings.TrimSuffix(cfg.SitePrefix, "/"), mcp_server.GlobalBasePath)), nil
+}
+
+func (i *imlMcpController) OnComplete() {
+ s := server.NewMCPServer("APIPark MCP Server", "1.0.0", server.WithLogging())
+ s.AddTool(
+ mcp2.NewTool(
+ "apipark_service_list",
+ mcp2.WithDescription("This tool is a standardized interface provided by the Apipark platform under the MCP (Model Context Protocol) framework, designed to retrieve metadata for all registered services in bulk. By invoking this tool, users can efficiently explore the complete list of published services and their core attributes, serving as a prerequisite for subsequent actions such as querying detailed API lists via service IDs, requesting access permissions, or integrating services."),
+ mcp2.WithString("keyword", mcp2.Description("Keyword for fuzzy search")),
+ ),
+ i.mcpModule.Services,
+ )
+ s.AddTool(
+ mcp2.NewTool(
+ "apipark_service_api_list",
+ mcp2.WithDescription("This tool is a standardized MCP (Model Context Protocol) interface provided by the Apipark platform, designed to retrieve OpenAPI specification documents for all APIs under a specified service using its service ID. By invoking this tool, users gain precise access to detailed API definitions (including endpoints, parameters, request/response schemas) for debugging, integration, or client SDK generation."),
+ mcp2.WithString("service", mcp2.Description("Service ID")),
+ ),
+ i.mcpModule.APIs,
+ )
+ s.AddTool(
+ mcp2.NewTool(
+ "apipark_invoke_api",
+ mcp2.WithDescription("This tool is a core MCP (Model Context Protocol) interface provided by the Apipark platform, enabling users to programmatically invoke APIs using metadata from apipark_service_api_list (API schemas). It acts as a unified gateway for executing API requests with built-in authentication, parameter validation, and error handling, returning structured responses for integration workflows."),
+ mcp2.WithString("path", mcp2.Description("API path"), mcp2.Required()),
+ mcp2.WithString("method", mcp2.Description("API method"), mcp2.Required()),
+ mcp2.WithString("content-type", mcp2.Description("API Request Content-Type. If method is POST,PUT,PATCH, it must be set. If not set, it will be ignored.")),
+ mcp2.WithObject("query", mcp2.Description("API Request query,param type is map[string]string")),
+ mcp2.WithObject("header", mcp2.Description("API Request header,param type is map[string]string")),
+ mcp2.WithString("body", mcp2.Description("API Request body")),
+ ),
+ i.mcpModule.Invoke,
+ )
+ i.server = server.NewSSEServer(s, server.WithBasePath(fmt.Sprintf("/api/v1/%s", mcp_server.GlobalBasePath)))
+ i.openServer = server.NewSSEServer(s, server.WithBasePath(fmt.Sprintf("/openapi/v1/%s", strings.Trim(mcp_server.GlobalBasePath, "/"))))
+}
+
+func (i *imlMcpController) GlobalMCPHandle(ctx *gin.Context) {
+ cfg := i.settingModule.Get(ctx)
+ req := ctx.Request.WithContext(utils.SetGatewayInvoke(ctx.Request.Context(), cfg.InvokeAddress))
+
+ i.server.ServeHTTP(ctx.Writer, req)
+}
+
+func (i *imlMcpController) GlobalHandleSSE(ctx *gin.Context) {
+ i.handleSSE(ctx, i.openServer)
+}
+
+func (i *imlMcpController) handleSSE(ctx *gin.Context, server http.Handler) {
+ apikey := ctx.Request.URL.Query().Get("apikey")
+ writer := &ResponseWriter{
+ Writer: ctx.Writer,
+ sessionId: make(chan string),
+ }
+ defer close(writer.sessionId)
+ sessionId := ""
+ go func() {
+ var ok bool
+ sessionId, ok = <-writer.sessionId
+ if !ok {
+ return
+ }
+ i.sessionKeys.Store(sessionId, apikey)
+ }()
+ server.ServeHTTP(writer, ctx.Request)
+ i.sessionKeys.Delete(sessionId)
+}
+
+func (i *imlMcpController) GlobalHandleMessage(ctx *gin.Context) {
+ i.handleMessage(ctx, i.openServer)
+}
+
+func (i *imlMcpController) MCPHandle(ctx *gin.Context) {
+ cfg := i.settingModule.Get(ctx)
+
+ req := ctx.Request.WithContext(utils.SetGatewayInvoke(ctx.Request.Context(), cfg.InvokeAddress))
+ mcp_server.ServeHTTP(ctx.Writer, req)
+}
+
+func (i *imlMcpController) ServiceHandleSSE(ctx *gin.Context) {
+ i.handleSSE(ctx, mcp_server.DefaultMCPServer())
+}
+
+func (i *imlMcpController) ServiceHandleMessage(ctx *gin.Context) {
+ i.handleMessage(ctx, mcp_server.DefaultMCPServer())
+}
+
+func (i *imlMcpController) handleMessage(ctx *gin.Context, server http.Handler) {
+ sessionId := ctx.Request.URL.Query().Get("sessionId")
+ apikey, ok := i.sessionKeys.Load(sessionId)
+ if !ok {
+ ctx.String(403, "sessionId not found")
+ return
+ }
+ cfg := i.settingModule.Get(ctx)
+ req := ctx.Request.WithContext(utils.SetGatewayInvoke(ctx.Request.Context(), cfg.InvokeAddress))
+ req = req.WithContext(utils.SetLabel(req.Context(), "apikey", apikey.(string)))
+ server.ServeHTTP(ctx.Writer, req)
+}
diff --git a/controller/mcp/mcp.go b/controller/mcp/mcp.go
new file mode 100644
index 00000000..780a0aa9
--- /dev/null
+++ b/controller/mcp/mcp.go
@@ -0,0 +1,24 @@
+package mcp
+
+import (
+ "reflect"
+
+ "github.com/eolinker/go-common/autowire"
+ "github.com/gin-gonic/gin"
+)
+
+type IMcpController interface {
+ MCPHandle(ctx *gin.Context)
+ GlobalMCPHandle(ctx *gin.Context)
+ GlobalHandleSSE(ctx *gin.Context)
+ GlobalHandleMessage(ctx *gin.Context)
+ ServiceHandleSSE(ctx *gin.Context)
+ ServiceHandleMessage(ctx *gin.Context)
+ GlobalMCPConfig(ctx *gin.Context) (string, error)
+}
+
+func init() {
+ autowire.Auto[IMcpController](func() reflect.Value {
+ return reflect.ValueOf(new(imlMcpController))
+ })
+}
diff --git a/controller/mcp/writer.go b/controller/mcp/writer.go
new file mode 100644
index 00000000..d2a48df0
--- /dev/null
+++ b/controller/mcp/writer.go
@@ -0,0 +1,35 @@
+package mcp
+
+import (
+ "net/http"
+ "regexp"
+)
+
+type ResponseWriter struct {
+ Writer http.ResponseWriter
+ sessionId chan string
+}
+
+func (r *ResponseWriter) Flush() {
+ fluster, ok := r.Writer.(http.Flusher)
+ if ok {
+ fluster.Flush()
+ }
+}
+
+func (r *ResponseWriter) Header() http.Header {
+ return r.Writer.Header()
+}
+
+func (r *ResponseWriter) Write(bytes []byte) (int, error) {
+ re := regexp.MustCompile(`sessionId=([^&?\s]+)`)
+ match := re.FindStringSubmatch(string(bytes))
+ if len(match) > 1 {
+ r.sessionId <- match[1]
+ }
+ return r.Writer.Write(bytes)
+}
+
+func (r *ResponseWriter) WriteHeader(statusCode int) {
+ r.Writer.WriteHeader(statusCode)
+}
diff --git a/controller/service/iml.go b/controller/service/iml.go
index e2f0bf32..489d66e2 100644
--- a/controller/service/iml.go
+++ b/controller/service/iml.go
@@ -296,7 +296,7 @@ func (i *imlServiceController) editAIService(ctx *gin.Context, id string, input
if input.Provider == nil {
return nil, fmt.Errorf("provider is required")
}
- if *input.Provider != "ollama" {
+ if *input.Provider != ai_provider_local.ProviderLocal {
_, has := model_runtime.GetProvider(*input.Provider)
if !has {
return nil, fmt.Errorf("provider not found")
@@ -330,7 +330,7 @@ func (i *imlServiceController) createAIService(ctx *gin.Context, teamID string,
modelId := ""
modelCfg := ""
modelType := "online"
- if *input.Provider == "ollama" {
+ if *input.Provider == ai_provider_local.ProviderLocal {
modelType = "local"
list, err := i.aiLocalModel.SimpleList(ctx)
if err != nil {
@@ -340,7 +340,7 @@ func (i *imlServiceController) createAIService(ctx *gin.Context, teamID string,
return nil, fmt.Errorf("no local model")
}
modelId = list[0].Id
- modelCfg = ai_provider_local.OllamaConfig
+ modelCfg = ai_provider_local.LocalConfig
} else {
pv, err := i.providerModule.Provider(ctx, *input.Provider)
if err != nil {
@@ -354,7 +354,8 @@ func (i *imlServiceController) createAIService(ctx *gin.Context, teamID string,
if !has {
return nil, fmt.Errorf("model %s not found", pv.DefaultLLM)
}
- modelId = m.ID()
+ //modelId = m.ID()
+ modelId = m.Name()
modelCfg = m.DefaultConfig()
}
@@ -367,7 +368,7 @@ func (i *imlServiceController) createAIService(ctx *gin.Context, teamID string,
return err
}
prefix := strings.Replace(input.Prefix, ":", "_", -1)
- path := fmt.Sprintf("/%s/chat", strings.Trim(prefix, "/"))
+ path := fmt.Sprintf("/%s/chat/completions", strings.Trim(prefix, "/"))
timeout := 300000
retry := 0
aiPrompt := &ai_api_dto.AiPrompt{
diff --git a/controller/system-apikey/apikey.go b/controller/system-apikey/apikey.go
new file mode 100644
index 00000000..c59fc03e
--- /dev/null
+++ b/controller/system-apikey/apikey.go
@@ -0,0 +1,25 @@
+package system_apikey
+
+import (
+ "reflect"
+
+ system_apikey_dto "github.com/APIParkLab/APIPark/module/system-apikey/dto"
+ "github.com/eolinker/go-common/autowire"
+ "github.com/gin-gonic/gin"
+)
+
+type IAPIKeyController interface {
+ Create(ctx *gin.Context, input *system_apikey_dto.Create) error
+ Update(ctx *gin.Context, id string, input *system_apikey_dto.Update) error
+ Delete(ctx *gin.Context, id string) error
+ Get(ctx *gin.Context, id string) (*system_apikey_dto.APIKey, error)
+ Search(ctx *gin.Context, keyword string) ([]*system_apikey_dto.Item, error)
+ SimpleList(ctx *gin.Context) ([]*system_apikey_dto.SimpleItem, error)
+ MyAPIKeys(ctx *gin.Context) ([]*system_apikey_dto.SimpleItem, error)
+}
+
+func init() {
+ autowire.Auto[IAPIKeyController](func() reflect.Value {
+ return reflect.ValueOf(new(imlAPIKeyController))
+ })
+}
diff --git a/controller/system-apikey/iml.go b/controller/system-apikey/iml.go
new file mode 100644
index 00000000..7afdd451
--- /dev/null
+++ b/controller/system-apikey/iml.go
@@ -0,0 +1,41 @@
+package system_apikey
+
+import (
+ system_apikey "github.com/APIParkLab/APIPark/module/system-apikey"
+ system_apikey_dto "github.com/APIParkLab/APIPark/module/system-apikey/dto"
+ "github.com/gin-gonic/gin"
+)
+
+var _ IAPIKeyController = new(imlAPIKeyController)
+
+type imlAPIKeyController struct {
+ apikeyModule system_apikey.IAPIKeyModule `autowired:""`
+}
+
+func (i *imlAPIKeyController) MyAPIKeys(ctx *gin.Context) ([]*system_apikey_dto.SimpleItem, error) {
+ return i.apikeyModule.MyAPIKeys(ctx)
+}
+
+func (i *imlAPIKeyController) Create(ctx *gin.Context, input *system_apikey_dto.Create) error {
+ return i.apikeyModule.Create(ctx, input)
+}
+
+func (i *imlAPIKeyController) Update(ctx *gin.Context, id string, input *system_apikey_dto.Update) error {
+ return i.apikeyModule.Update(ctx, id, input)
+}
+
+func (i *imlAPIKeyController) Delete(ctx *gin.Context, id string) error {
+ return i.apikeyModule.Delete(ctx, id)
+}
+
+func (i *imlAPIKeyController) Get(ctx *gin.Context, id string) (*system_apikey_dto.APIKey, error) {
+ return i.apikeyModule.Get(ctx, id)
+}
+
+func (i *imlAPIKeyController) Search(ctx *gin.Context, keyword string) ([]*system_apikey_dto.Item, error) {
+ return i.apikeyModule.Search(ctx, keyword)
+}
+
+func (i *imlAPIKeyController) SimpleList(ctx *gin.Context) ([]*system_apikey_dto.SimpleItem, error) {
+ return i.apikeyModule.SimpleList(ctx)
+}
diff --git a/controller/system/iml.go b/controller/system/iml.go
index 44f9e37e..749e73b0 100644
--- a/controller/system/iml.go
+++ b/controller/system/iml.go
@@ -395,36 +395,36 @@ func (i *imlInitController) createAIService(ctx context.Context, teamID string,
if err != nil {
return err
}
- path := fmt.Sprintf("/%s/demo_translation_api", strings.Trim(input.Prefix, "/"))
+ path := fmt.Sprintf("/%s/chat/completions", strings.Trim(input.Prefix, "/"))
timeout := 300000
retry := 0
aiPrompt := &ai_api_dto.AiPrompt{
- Variables: []*ai_api_dto.AiPromptVariable{
- {
- Key: "source_lang",
- Description: "",
- Require: true,
- },
- {
- Key: "target_lang",
- Description: "",
- Require: true,
- },
- {
- Key: "text",
- Description: "",
- Require: true,
- },
- },
- Prompt: "You need to translate {{source_lang}} into {{target_lang}}, and the following is the content that needs to be translated.\n---\n{{text}}",
+ //Variables: []*ai_api_dto.AiPromptVariable{
+ // {
+ // Key: "source_lang",
+ // Description: "",
+ // Require: true,
+ // },
+ // {
+ // Key: "target_lang",
+ // Description: "",
+ // Require: true,
+ // },
+ // {
+ // Key: "text",
+ // Description: "",
+ // Require: true,
+ // },
+ //},
+ //Prompt: "You need to translate {{source_lang}} into {{target_lang}}, and the following is the content that needs to be translated.\n---\n{{text}}",
}
aiModel := &ai_api_dto.AiModel{
Id: m.ID(),
Config: m.DefaultConfig(),
Provider: providerId,
}
- name := "Demo Translation API"
- description := "A demo that shows you how to use a prompt to create a Translation API."
+ name := "Demo Chat API"
+ description := "A demo that shows you how to use a prompt to create a Chat API."
apiId := uuid.New().String()
err = i.aiAPIModule.Create(
ctx,
diff --git a/frontend/packages/common/src/components/aoplatform/PublishApprovalModalContent.tsx b/frontend/packages/common/src/components/aoplatform/PublishApprovalModalContent.tsx
index 6272fd42..5016fac9 100644
--- a/frontend/packages/common/src/components/aoplatform/PublishApprovalModalContent.tsx
+++ b/frontend/packages/common/src/components/aoplatform/PublishApprovalModalContent.tsx
@@ -1,5 +1,5 @@
import { App, Col, Form, Input, Row, Table, Tooltip } from 'antd'
-import { forwardRef, useEffect, useImperativeHandle, useMemo } from 'react'
+import { forwardRef, useEffect, useImperativeHandle, useMemo, useRef } from 'react'
import {
PublishApprovalInfoType,
PublishApprovalModalHandle,
@@ -36,6 +36,7 @@ export const PublishApprovalModalContent = forwardRef(null)
const save: (operate: 'pass' | 'refuse') => Promise = (operate) => {
if (type === 'view') {
@@ -140,6 +141,12 @@ export const PublishApprovalModalContent = forwardRef {
form.setFieldsValue({ opinion: '', ...data })
+ // 如果是添加模式且insidePage为true,自动聚焦版本号输入框
+ if (type === 'add' && insidePage && versionInputRef.current) {
+ setTimeout(() => {
+ versionInputRef.current?.focus()
+ }, 100)
+ }
}, [])
const translatedUpstreamColumns = useMemo(
@@ -335,7 +342,12 @@ export const PublishApprovalModalContent = forwardRef
-
+
diff --git a/frontend/packages/core/src/components/AIProviderSelect/index.tsx b/frontend/packages/core/src/components/AIProviderSelect/index.tsx
index 5b9e28f4..c0a7fecd 100644
--- a/frontend/packages/core/src/components/AIProviderSelect/index.tsx
+++ b/frontend/packages/core/src/components/AIProviderSelect/index.tsx
@@ -91,8 +91,15 @@ const AIProviderSelect: React.FC = ({ value, onChange, so
label: (
{provider.name}
diff --git a/frontend/packages/core/src/const/ai-service/const.tsx b/frontend/packages/core/src/const/ai-service/const.tsx
index ccf72b07..a058f636 100644
--- a/frontend/packages/core/src/const/ai-service/const.tsx
+++ b/frontend/packages/core/src/const/ai-service/const.tsx
@@ -19,11 +19,11 @@ export const AI_SERVICE_ROUTER_TABLE_COLUMNS: PageProColumns (