mirror of
https://github.com/itme-brain/agent-team.git
synced 2026-05-08 10:40:12 -04:00
Reduce the output token limit in order to maintain strong tokens-per-second generation speed
This commit is contained in:
parent
9d5559e2b4
commit
d6e0e9f2d9
1 changed file with 1 addition and 1 deletion
|
|
@@ -13,7 +13,7 @@
|
|||
"name": "Qwen3-Coder-30B-A3B-Instruct-Q6",
|
||||
"limit": {
|
||||
"context": 262144,
|
||||
- "output": 262144
|
||||
+ "output": 8192
|
||||
},
|
||||
"cost": {
|
||||
"input": 0,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue