Spaces:
Runtime error
Runtime error
File size: 927 Bytes
6b02e3d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 |
import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification

# Single source of truth for the checkpoint so the tokenizer and the model
# are always loaded from the same place.
# NOTE(review): this appears to be a base (not fine-tuned) checkpoint, in which
# case the sequence-classification head is newly initialised on load and the
# score printed below is not a meaningful similarity until the model is
# fine-tuned on a sentence-pair task (or swapped for a fine-tuned checkpoint).
MODEL_NAME = "distilbert-base-multilingual-cased"

tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME)

# example sentences
sentence1 = "O Brasil é o maior país da América do Sul"
sentence2 = "A Argentina é o segundo maior país da América do Sul"

# tokenize both sentences together as one sentence-pair input
inputs = tokenizer(
    sentence1,
    sentence2,
    padding=True,
    truncation=True,
    max_length=250,
    return_tensors="pt",
)

# get the output logits for the sentence pair; this is inference only, so
# disable gradient tracking to avoid building an autograd graph
with torch.no_grad():
    outputs = model(**inputs).logits

# turn the logits into probabilities over the classes (dim=1 is the class axis)
probs = outputs.softmax(dim=1)

# the script reads class index 1 of the first (only) pair as the "similar" score
similarity_score = probs[0][1].item()
print("Similarity score:", similarity_score)