Unverified Commit 3242cf53 authored by takatost's avatar takatost Committed by GitHub

fix: moonshot context size error (#2406)

parent d8de2017
...@@ -14,6 +14,7 @@ ...@@ -14,6 +14,7 @@
- minimax - minimax
- tongyi - tongyi
- wenxin - wenxin
- moonshot
- jina - jina
- chatglm - chatglm
- xinference - xinference
......
...@@ -7,21 +7,17 @@ features: ...@@ -7,21 +7,17 @@ features:
- agent-thought - agent-thought
model_properties: model_properties:
mode: chat mode: chat
context_size: 4096 context_size: 128000
parameter_rules: parameter_rules:
- name: temperature - name: temperature
use_template: temperature use_template: temperature
- name: top_p - name: top_p
use_template: top_p use_template: top_p
- name: presence_penalty
use_template: presence_penalty
- name: frequency_penalty
use_template: frequency_penalty
- name: max_tokens - name: max_tokens
use_template: max_tokens use_template: max_tokens
default: 512 default: 1024
min: 1 min: 1
max: 4096 max: 128000
pricing: pricing:
input: '0.06' input: '0.06'
output: '0.06' output: '0.06'
......
...@@ -7,21 +7,17 @@ features: ...@@ -7,21 +7,17 @@ features:
- agent-thought - agent-thought
model_properties: model_properties:
mode: chat mode: chat
context_size: 4096 context_size: 32000
parameter_rules: parameter_rules:
- name: temperature - name: temperature
use_template: temperature use_template: temperature
- name: top_p - name: top_p
use_template: top_p use_template: top_p
- name: presence_penalty
use_template: presence_penalty
- name: frequency_penalty
use_template: frequency_penalty
- name: max_tokens - name: max_tokens
use_template: max_tokens use_template: max_tokens
default: 512 default: 1024
min: 1 min: 1
max: 4096 max: 32000
pricing: pricing:
input: '0.024' input: '0.024'
output: '0.024' output: '0.024'
......
...@@ -7,21 +7,17 @@ features: ...@@ -7,21 +7,17 @@ features:
- agent-thought - agent-thought
model_properties: model_properties:
mode: chat mode: chat
context_size: 4096 context_size: 8192
parameter_rules: parameter_rules:
- name: temperature - name: temperature
use_template: temperature use_template: temperature
- name: top_p - name: top_p
use_template: top_p use_template: top_p
- name: presence_penalty
use_template: presence_penalty
- name: frequency_penalty
use_template: frequency_penalty
- name: max_tokens - name: max_tokens
use_template: max_tokens use_template: max_tokens
default: 512 default: 512
min: 1 min: 1
max: 4096 max: 8192
pricing: pricing:
input: '0.012' input: '0.012'
output: '0.012' output: '0.012'
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment