Ali2206 committed on
Commit
b3f455d
·
verified ·
1 Parent(s): f2a9805

Update src/txagent/txagent.py

Browse files
Files changed (1) hide show
  1. src/txagent/txagent.py +4 -3
src/txagent/txagent.py CHANGED
@@ -78,9 +78,10 @@ class TxAgent:
78
  model=self.model_name,
79
  dtype="float16",
80
  max_model_len=131072,
81
- max_num_batched_tokens=32768, # Increased for A100 80GB
82
- gpu_memory_utilization=0.9, # Higher utilization for better performance
83
- trust_remote_code=True
 
84
  )
85
  self.chat_template = Template(self.model.get_tokenizer().chat_template)
86
  self.tokenizer = self.model.get_tokenizer()
 
78
  model=self.model_name,
79
  dtype="float16",
80
  max_model_len=131072,
81
+ max_num_batched_tokens=65536, # Increased for A100 80GB
82
+ gpu_memory_utilization=0.95, # Higher utilization for better performance
83
+ trust_remote_code=True,
84
+ engine_args={"max_num_seqs": 512},
85
  )
86
  self.chat_template = Template(self.model.get_tokenizer().chat_template)
87
  self.tokenizer = self.model.get_tokenizer()