Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -7,10 +7,10 @@ model_name = "allenai/scibert_scivocab_uncased"
|
|
7 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
8 |
model = AutoModelForSequenceClassification.from_pretrained(model_name, num_labels=3)
|
9 |
|
10 |
-
# 2️⃣ Dataset laden (
|
11 |
-
dataset = load_dataset("armanc/scientific_papers", trust_remote_code=True)
|
12 |
|
13 |
-
# 3️⃣ Tokenisierung der Texte
|
14 |
def tokenize_function(examples):
|
15 |
return tokenizer(examples["text"], padding="max_length", truncation=True)
|
16 |
|
|
|
7 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
8 |
model = AutoModelForSequenceClassification.from_pretrained(model_name, num_labels=3)
|
9 |
|
10 |
+
# 2️⃣ Dataset laden (mit spezifischer Konfiguration: "arxiv" oder "pubmed")
|
11 |
+
dataset = load_dataset("armanc/scientific_papers", "arxiv", trust_remote_code=True) # Oder "pubmed"
|
12 |
|
13 |
+
# 3️⃣ Tokenisierung der Texte
|
14 |
def tokenize_function(examples):
    """Tokenize the body text of one dataset example or a batch of examples.

    Args:
        examples: Mapping from column name to value(s), as passed by
            ``Dataset.map``.

    Returns:
        The output of the module-level ``tokenizer`` for the selected
        column, padded to the maximum length and truncated.

    Raises:
        KeyError: If neither a ``"text"`` nor an ``"article"`` column exists.
    """
    # The "arxiv"/"pubmed" configs of the scientific_papers dataset expose the
    # paper body under "article" and have no "text" column, so indexing
    # "text" unconditionally fails. Keep "text" as the first choice so
    # datasets that do provide it behave exactly as before.
    text_column = "text" if "text" in examples else "article"
    # NOTE(review): no explicit max_length is passed; confirm the tokenizer
    # defines a model maximum, otherwise padding/truncation may not apply.
    return tokenizer(examples[text_column], padding="max_length", truncation=True)
|
16 |
|