feat: wenxin add yi-34b-chat (#7117)

This commit is contained in:
小羽
2024-08-08 12:01:21 +00:00
committed by GitHub
parent ad682c394d
commit 7944ce0594
2 changed files with 33 additions and 1 deletions

View File

@@ -142,6 +142,7 @@ class ErnieBotModel:
'ernie-character-8k-0321': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-char-8k',
'ernie-4.0-turbo-8k': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-4.0-turbo-8k',
'ernie-4.0-turbo-8k-preview': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-4.0-turbo-8k-preview',
'yi_34b_chat': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/yi_34b_chat',
}
function_calling_supports = [
@@ -154,7 +155,8 @@ class ErnieBotModel:
'ernie-3.5-128k',
'ernie-4.0-8k',
'ernie-4.0-turbo-8k',
'ernie-4.0-turbo-8k-preview'
'ernie-4.0-turbo-8k-preview',
'yi_34b_chat'
]
api_key: str = ''

View File

@@ -0,0 +1,30 @@
# Predefined model definition for `yi_34b_chat`, a chat-mode LLM.
# NOTE(review): the `model` value presumably has to match the key used for
# this model in the provider's endpoint table — confirm against the provider code.
model: yi_34b_chat
label:
  en_US: yi_34b_chat
model_type: llm
features:
  - agent-thought
model_properties:
  mode: chat
  # Presumably measured in tokens — confirm against the provider's documentation.
  context_size: 32000
# Each rule names one tunable parameter, pulls in a shared template through
# `use_template`, and overrides that template's bounds/default for this model.
parameter_rules:
  - name: temperature
    use_template: temperature
    min: 0.1
    max: 1.0
    default: 0.95
  - name: top_p
    use_template: top_p
    min: 0
    max: 1.0
    default: 0.7
  - name: max_tokens
    use_template: max_tokens
    default: 4096
    min: 2
    max: 4096
  - name: presence_penalty
    use_template: presence_penalty
    default: 1.0
    min: 1.0
    max: 2.0