Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -30,14 +30,14 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
|
|
30 |
model = AutoModelForCausalLM.from_pretrained(
|
31 |
model_name,
|
32 |
device_map=device,
|
33 |
-
torch_dtype=torch.
|
34 |
)
|
35 |
#model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", torch_dtype="auto")
|
36 |
qa_pipeline = pipeline(
|
37 |
"text-generation",
|
38 |
model=model,
|
39 |
tokenizer=tokenizer,
|
40 |
-
max_new_tokens=
|
41 |
pad_token_id=tokenizer.eos_token_id
|
42 |
)
|
43 |
|
|
|
30 |
model = AutoModelForCausalLM.from_pretrained(
|
31 |
model_name,
|
32 |
device_map=device,
|
33 |
+
torch_dtype=torch.float16 if device == "cuda" else torch.float32
|
34 |
)
|
35 |
#model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", torch_dtype="auto")
|
36 |
qa_pipeline = pipeline(
|
37 |
"text-generation",
|
38 |
model=model,
|
39 |
tokenizer=tokenizer,
|
40 |
+
max_new_tokens=1500,
|
41 |
pad_token_id=tokenizer.eos_token_id
|
42 |
)
|
43 |
|