submission-template

Sleeping

App Files Files Community

Zen0 committed on Jan 10

Commit

f1edb98

verified ·

1 Parent(s): 9685f7b

Update tasks/text.py

Browse files

Files changed (1) hide show

tasks/text.py +38 -3

tasks/text.py CHANGED Viewed

@@ -56,9 +56,44 @@ async def evaluate_text(request: TextEvaluationRequest):
     # Update the code below to replace the random baseline by your model inference within the inference pass where the energy consumption and emissions are tracked.
     #--------------------------------------------------------------------------------------------
-    # Make random predictions (placeholder for actual model inference)
-    true_labels = test_dataset["label"]
-    predictions = [random.randint(0, 7) for _ in range(len(true_labels))]
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE STOPS HERE

     # Update the code below to replace the random baseline by your model inference within the inference pass where the energy consumption and emissions are tracked.
     #--------------------------------------------------------------------------------------------
+    #--------------------------------------------------------------------------------------------
+    # Load your model and tokenizer from Hugging Face
+    #--------------------------------------------------------------------------------------------
+    model_name = "Zen0/FrugalDisinfoHunter"  # Model identifier from Hugging Face
+    tokenizer = AutoTokenizer.from_pretrained(model_name)
+    model = AutoModelForSequenceClassification.from_pretrained(model_name)
+    #--------------------------------------------------------------------------------------------
+    # Load the dataset
+    #--------------------------------------------------------------------------------------------
+    # Assuming 'quotaclimat/frugalaichallenge-text-train' is the dataset you are working with
+    dataset = load_dataset("quotaclimat/frugalaichallenge-text-train")
+    # Access the test dataset (you can change this if you want to use a different split)
+    test_dataset = dataset['test']  # Assuming you have a 'test' split available
+    #--------------------------------------------------------------------------------------------
+    # Tokenize the text data
+    #--------------------------------------------------------------------------------------------
+    # Tokenize the test data (the text field contains the quotes)
+    test_texts = test_dataset["text"]  # The field 'text' contains the climate quotes
+    inputs = tokenizer(test_texts, padding=True, truncation=True, return_tensors="pt", max_length=512)
+    #--------------------------------------------------------------------------------------------
+    # Inference
+    #--------------------------------------------------------------------------------------------
+    # Run inference on the dataset using the model
+    with torch.no_grad():  # Disable gradient calculations
+        outputs = model(**inputs)
+        logits = outputs.logits
+    # Get predictions from the logits (choose the class with the highest logit)
+    predictions = torch.argmax(logits, dim=-1).cpu().numpy()  # Convert to numpy array for use
     #--------------------------------------------------------------------------------------------
     # YOUR MODEL INFERENCE STOPS HERE