فهرست منبع

feat: wenxin add yi-34b-chat (#7117)

小羽 8 ماه پیش
والد
کامیت
7944ce0594

+ 3 - 1
api/core/model_runtime/model_providers/wenxin/llm/ernie_bot.py

@@ -142,6 +142,7 @@ class ErnieBotModel:
         'ernie-character-8k-0321': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-char-8k',
         'ernie-4.0-turbo-8k': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-4.0-turbo-8k',
         'ernie-4.0-turbo-8k-preview': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/ernie-4.0-turbo-8k-preview',
+        'yi_34b_chat': 'https://aip.baidubce.com/rpc/2.0/ai_custom/v1/wenxinworkshop/chat/yi_34b_chat',
     }
 
     function_calling_supports = [
@@ -154,7 +155,8 @@ class ErnieBotModel:
         'ernie-3.5-128k',
         'ernie-4.0-8k',
         'ernie-4.0-turbo-8k',
-        'ernie-4.0-turbo-8k-preview'
+        'ernie-4.0-turbo-8k-preview',
+        'yi_34b_chat'
     ]
 
     api_key: str = ''

+ 30 - 0
api/core/model_runtime/model_providers/wenxin/llm/yi_34b_chat.yaml

@@ -0,0 +1,30 @@
+model: yi_34b_chat
+label:
+  en_US: yi_34b_chat
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 32000
+parameter_rules:
+  - name: temperature
+    use_template: temperature
+    min: 0.1
+    max: 1.0
+    default: 0.95
+  - name: top_p
+    use_template: top_p
+    min: 0
+    max: 1.0
+    default: 0.7
+  - name: max_tokens
+    use_template: max_tokens
+    default: 4096
+    min: 2
+    max: 4096
+  - name: presence_penalty
+    use_template: presence_penalty
+    default: 1.0
+    min: 1.0
+    max: 2.0