chansung committed on
Commit
8978ec6
·
1 Parent(s): 4e963f7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -156,12 +156,12 @@ def submit(
156
  "custom": {
157
  health_route: "/health",
158
  env: {
159
- DISABLE_CUSTOM_KERNELS: "true" if custom_kernel == "Enabled" else "false",
160
- MAX_BATCH_PREFILL_TOKENS: str(max_batch_prefill_token),
161
- MAX_BATCH_TOTAL_TOKENS?: str(max_batch_total_token);
162
- MAX_INPUT_LENGTH: str(max_input_length),
163
- MAX_TOTAL_TOKENS: str(max_tokens),
164
- MODEL_ID: repository_selector.lower(),
165
  # QUANTIZE: 'bitsandbytes' | 'gptq';
166
  },
167
  url: "ghcr.io/huggingface/text-generation-inference:1.0.1",
 
156
  "custom": {
157
  health_route: "/health",
158
  env: {
159
+ "DISABLE_CUSTOM_KERNELS": "true" if custom_kernel == "Enabled" else "false",
160
+ "MAX_BATCH_PREFILL_TOKENS": str(max_batch_prefill_token),
161
+ "MAX_BATCH_TOTAL_TOKENS": str(max_batch_total_token);
162
+ "MAX_INPUT_LENGTH": str(max_input_length),
163
+ "MAX_TOTAL_TOKENS": str(max_tokens),
164
+ "MODEL_ID": repository_selector.lower(),
165
  # QUANTIZE: 'bitsandbytes' | 'gptq';
166
  },
167
  url: "ghcr.io/huggingface/text-generation-inference:1.0.1",