Update src/txagent/txagent.py
Browse files
- src/txagent/txagent.py +4 -3
src/txagent/txagent.py
CHANGED
@@ -78,9 +78,10 @@ class TxAgent:
|
|
78 |
model=self.model_name,
|
79 |
dtype="float16",
|
80 |
max_model_len=131072,
|
81 |
-
max_num_batched_tokens=
|
82 |
-
gpu_memory_utilization=0.
|
83 |
-
trust_remote_code=True
|
|
|
84 |
)
|
85 |
self.chat_template = Template(self.model.get_tokenizer().chat_template)
|
86 |
self.tokenizer = self.model.get_tokenizer()
|
|
|
78 |
model=self.model_name,
|
79 |
dtype="float16",
|
80 |
max_model_len=131072,
|
81 |
+
max_num_batched_tokens=65536, # Increased for A100 80GB
|
82 |
+
gpu_memory_utilization=0.95, # Higher utilization for better performance
|
83 |
+
trust_remote_code=True,
|
84 |
+
engine_args={"max_num_seqs": 512},
|
85 |
)
|
86 |
self.chat_template = Template(self.model.get_tokenizer().chat_template)
|
87 |
self.tokenizer = self.model.get_tokenizer()
|