CPS-Test-Mobile

Paused

Ali2206 committed on Apr 26

Commit

589b0c2

verified ·

1 Parent(s): 2639902

Update src/txagent/txagent.py

Files changed (1) hide show

src/txagent/txagent.py CHANGED Viewed

@@ -78,8 +78,8 @@ class TxAgent:
             model=self.model_name,
             dtype="float16",
             max_model_len=131072,
-            max_num_batched_tokens=32768,  # Increased for A100 80GB
-            gpu_memory_utilization=0.9,    # Higher utilization for better performance
             trust_remote_code=True
         )
         self.chat_template = Template(self.model.get_tokenizer().chat_template)
@@ -428,7 +428,7 @@ class TxAgent:
         logits_processor = self.build_logits_processor(messages, model)
         sampling_params = SamplingParams(
-            temperature=temperature,
             max_tokens=max_new_tokens,
             seed=seed if seed is not None else self.seed,
         )

             model=self.model_name,
             dtype="float16",
             max_model_len=131072,
+            max_num_batched_tokens=65536,  # Increased for A100 80GB
+            gpu_memory_utilization=0.95,    # Higher utilization for better performance
             trust_remote_code=True
         )
         self.chat_template = Template(self.model.get_tokenizer().chat_template)
         logits_processor = self.build_logits_processor(messages, model)
         sampling_params = SamplingParams(
+            temperature=temperature if temperature is not None else 0.0,
             max_tokens=max_new_tokens,
             seed=seed if seed is not None else self.seed,
         )