nsarrazin HF Staff committed on
Commit
29ce6ea
·
1 Parent(s): 7bda7a0

Revert "Request less `max_new_tokens` on tools and reduce `truncate` on CMD R+ (#1292)"

Browse files
chart/env/prod.yaml CHANGED
@@ -47,7 +47,7 @@ envVars:
47
  "tools": true,
48
  "parameters": {
49
  "stop": ["<|END_OF_TURN_TOKEN|>"],
50
- "truncate" : 12288,
51
  "max_new_tokens" : 2048,
52
  "temperature" : 0.3
53
  },
 
47
  "tools": true,
48
  "parameters": {
49
  "stop": ["<|END_OF_TURN_TOKEN|>"],
50
+ "truncate" : 28672,
51
  "max_new_tokens" : 2048,
52
  "temperature" : 0.3
53
  },
src/lib/server/textGeneration/tools.ts CHANGED
@@ -131,7 +131,7 @@ export async function* runTools(
131
  for await (const output of await endpoint({
132
  messages: messagesWithFilesPrompt,
133
  preprompt,
134
- generateSettings: { ...assistant?.generateSettings, max_new_tokens: 512 },
135
  tools,
136
  })) {
137
  // model natively supports tool calls
 
131
  for await (const output of await endpoint({
132
  messages: messagesWithFilesPrompt,
133
  preprompt,
134
+ generateSettings: assistant?.generateSettings,
135
  tools,
136
  })) {
137
  // model natively supports tool calls