Skip to content

Commit

Permalink
add modelhub models
Browse files Browse the repository at this point in the history
  • Loading branch information
HSPK committed May 30, 2024
1 parent 57e0980 commit b6fcecc
Show file tree
Hide file tree
Showing 48 changed files with 1,397 additions and 7,427 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for Baichuan2-53B (chat-mode LLM).
model: Baichuan2-53B
# Display names per locale.
label:
  zh_Hans: Baichuan2-53B
  en_US: Baichuan2-53B
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 32768
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 32768
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.02"
  output: "0.02"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for Baichuan2-Turbo-192k (chat-mode LLM).
model: Baichuan2-Turbo-192k
# Display names per locale.
label:
  zh_Hans: Baichuan2-Turbo-192k
  en_US: Baichuan2-Turbo-192k
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 192000
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 192000
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.016"
  output: "0.016"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
Expand Up @@ -9,19 +9,25 @@ features:
- stream-tool-call
model_properties:
mode: chat
context_size: 8192
context_size: 32768
parameter_rules:
- name: temperature
use_template: temperature
- name: top_p
use_template: top_p
- name: presence_penalty
use_template: presence_penalty
- name: frequency_penalty
use_template: frequency_penalty
- name: max_tokens
use_template: max_tokens
default: 512
default: 2048
min: 1
max: 8192
max: 32768
- name: response_format
use_template: response_format
pricing:
input: "0.003"
output: "0.004"
input: "0.008"
output: "0.008"
unit: "0.001"
currency: USD
currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for Baichuan3-Turbo-128k (chat-mode LLM).
model: Baichuan3-Turbo-128k
# Display names per locale.
label:
  zh_Hans: Baichuan3-Turbo-128k
  en_US: Baichuan3-Turbo-128k
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 128000
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 128000
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.024"
  output: "0.024"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for Baichuan3-Turbo (chat-mode LLM).
model: Baichuan3-Turbo
# Display names per locale.
label:
  zh_Hans: Baichuan3-Turbo
  en_US: Baichuan3-Turbo
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 32768
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 32768
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.012"
  output: "0.012"
  unit: "0.001"
  currency: CNY
33 changes: 33 additions & 0 deletions api/core/model_runtime/model_providers/modelhub/llm/Baichuan4.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for Baichuan4 (chat-mode LLM).
model: Baichuan4
# Display names per locale.
label:
  zh_Hans: Baichuan4
  en_US: Baichuan4
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 32768
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 32768
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.1"
  output: "0.1"
  unit: "0.001"
  currency: CNY
48 changes: 45 additions & 3 deletions api/core/model_runtime/model_providers/modelhub/llm/_position.yaml
Original file line number Diff line number Diff line change
@@ -1,4 +1,46 @@
# Ordered list of model identifiers for this provider; each name appears
# exactly once (duplicate entries would make the effective position ambiguous).
# Presumably consumed as the display order of the models — confirm against the
# loader of _position.yaml.
- Baichuan4
- Baichuan3-Turbo
- Baichuan3-Turbo-128k
- Baichuan2-Turbo
- Baichuan2-Turbo-192k
- Baichuan2-53B
- chatglm-66b
- glm-4
- glm-3-turbo
- deepseek-chat-v2
- deepseek-coder
- gemini-pro
- abab6.5-chat
- abab6.5s-chat
- abab6.5g-chat
- abab6-chat
- abab5.5-chat
- moonshot-v1-8k
- moonshot-v1-32k
- moonshot-v1-128k
- gpt-4o
- gpt-4o-2024-05-13
- gpt-4-turbo
- gpt-4-turbo-2024-04-09
- gpt-4-turbo-preview
- gpt-4-0125-preview
- gpt-4-1106-preview
- gpt-4-vision-preview
- gpt-4-1106-vision-preview
- gpt-4
- gpt-4-0613
- gpt-3.5-turbo-0125
- gpt-3.5-turbo
- gpt-3.5-turbo-1106
- baichuan2-7b
- chatglm3
- chatglm3-32k
- deepseek-coder-6.7b-instruct
- deepseek-coder-6.7b-base
- lingua
- oneke
- qwen-14b-chat
- xverse-13b-256k
- yi-6b-base
- yi-6b-200k
- yi-6b-chat
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for abab5.5-chat (chat-mode LLM).
model: abab5.5-chat
# Display names per locale.
label:
  zh_Hans: abab5.5-chat
  en_US: abab5.5-chat
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 16384
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 16384
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.015"
  output: "0.015"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for abab6-chat (chat-mode LLM).
model: abab6-chat
# Display names per locale.
label:
  zh_Hans: abab6-chat
  en_US: abab6-chat
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 32768
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 32768
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.1"
  output: "0.1"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for abab6.5-chat (chat-mode LLM).
model: abab6.5-chat
# Display names per locale.
label:
  zh_Hans: abab6.5-chat
  en_US: abab6.5-chat
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 8192
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 8192
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.03"
  output: "0.03"
  unit: "0.001"
  currency: CNY
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Model definition for abab6.5g-chat (chat-mode LLM).
model: abab6.5g-chat
# Display names per locale.
label:
  zh_Hans: abab6.5g-chat
  en_US: abab6.5g-chat
model_type: llm
features:
  - multi-tool-call
  - agent-thought
  - stream-tool-call
model_properties:
  mode: chat
  context_size: 8192
# Tunable request parameters; entries with only `use_template` take all of
# their settings from the named template.
parameter_rules:
  - name: temperature
    use_template: temperature
  - name: top_p
    use_template: top_p
  - name: presence_penalty
    use_template: presence_penalty
  - name: frequency_penalty
    use_template: frequency_penalty
  - name: max_tokens
    use_template: max_tokens
    default: 2048
    min: 1
    # NOTE(review): upper bound equals context_size; confirm the upstream API
    # really accepts this many completion tokens.
    max: 8192
  - name: response_format
    use_template: response_format
# Prices are quoted so they stay exact decimal strings rather than floats.
# Presumably `unit: "0.001"` means the price applies per 1000 tokens — confirm
# against the pricing consumer.
pricing:
  input: "0.005"
  output: "0.005"
  unit: "0.001"
  currency: CNY
Loading

0 comments on commit b6fcecc

Please sign in to comment.