mirror of
https://github.com/itme-brain/agent-team.git
synced 2026-05-08 10:40:12 -04:00
Reduce the output token limit to maintain strong tokens-per-second (tok/s) generation speed
This commit is contained in:
parent
9d5559e2b4
commit
d6e0e9f2d9
1 changed file with 1 addition and 1 deletion
|
|
@@ -13,7 +13,7 @@
|
||||||
"name": "Qwen3-Coder-30B-A3B-Instruct-Q6",
|
"name": "Qwen3-Coder-30B-A3B-Instruct-Q6",
|
||||||
"limit": {
|
"limit": {
|
||||||
"context": 262144,
|
"context": 262144,
|
||||||
"output": 262144
|
"output": 8192
|
||||||
},
|
},
|
||||||
"cost": {
|
"cost": {
|
||||||
"input": 0,
|
"input": 0,
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue