Commit · 16814ca
1 Parent(s): 769b214
changing model
Browse files
- NeuralTextGenerator.py +1 -1
- app.py +1 -1
NeuralTextGenerator.py
CHANGED
@@ -47,7 +47,7 @@ class BertTextGenerator:
|
|
47 |
self.model, optimizer = amp.initialize(self.model, optimizer, opt_level="O2", keep_batchnorm_fp32=True,
|
48 |
loss_scale="dynamic")
|
49 |
|
50 |
-
self.tokenizer = AutoTokenizer.from_pretrained(
|
51 |
use_fast=use_fast,
|
52 |
do_basic_tokenize=do_basic_tokenize) # added to avoid splitting of unused tokens
|
53 |
self.num_attention_masks = len(self.model.base_model.base_model.encoder.layer)
|
|
|
47 |
self.model, optimizer = amp.initialize(self.model, optimizer, opt_level="O2", keep_batchnorm_fp32=True,
|
48 |
loss_scale="dynamic")
|
49 |
|
50 |
+
self.tokenizer = AutoTokenizer.from_pretrained(model_version, do_lower_case="uncased" in model_version,
|
51 |
use_fast=use_fast,
|
52 |
do_basic_tokenize=do_basic_tokenize) # added to avoid splitting of unused tokens
|
53 |
self.num_attention_masks = len(self.model.base_model.base_model.encoder.layer)
|
app.py
CHANGED
@@ -15,7 +15,7 @@ from NeuralTextGenerator import BertTextGenerator
|
|
15 |
# generator = pipeline("sentiment-analysis")
|
16 |
|
17 |
# print('dfg')
|
18 |
-
model_name = "
|
19 |
en_model = BertTextGenerator(model_name)
|
20 |
tokenizer = en_model.tokenizer
|
21 |
model = en_model.model
|
|
|
15 |
# generator = pipeline("sentiment-analysis")
|
16 |
|
17 |
# print('dfg')
|
18 |
+
model_name = "cardiffnlp/twitter-xlm-roberta-base" #"dbmdz/bert-base-italian-uncased"
|
19 |
en_model = BertTextGenerator(model_name)
|
20 |
tokenizer = en_model.tokenizer
|
21 |
model = en_model.model
|