Spaces:
Running
Running
Revert "Request less `max_new_tokens` on tools and reduce `truncate` on CMD R+ (#1292)"
Browse files
chart/env/prod.yaml
CHANGED
@@ -47,7 +47,7 @@ envVars:
  47 | "tools": true,
  48 | "parameters": {
  49 | "stop": ["<|END_OF_TURN_TOKEN|>"],
- 50 | "truncate" :
  51 | "max_new_tokens" : 2048,
  52 | "temperature" : 0.3
  53 | },

  47 | "tools": true,
  48 | "parameters": {
  49 | "stop": ["<|END_OF_TURN_TOKEN|>"],
+ 50 | "truncate" : 28672,
  51 | "max_new_tokens" : 2048,
  52 | "temperature" : 0.3
  53 | },
src/lib/server/textGeneration/tools.ts
CHANGED
@@ -131,7 +131,7 @@ export async function* runTools(
  131 | for await (const output of await endpoint({
  132 | messages: messagesWithFilesPrompt,
  133 | preprompt,
- 134 | generateSettings:
  135 | tools,
  136 | })) {
  137 | // model natively supports tool calls

  131 | for await (const output of await endpoint({
  132 | messages: messagesWithFilesPrompt,
  133 | preprompt,
+ 134 | generateSettings: assistant?.generateSettings,
  135 | tools,
  136 | })) {
  137 | // model natively supports tool calls