Add ROBERTA classifier ranking PoC, with 77pc off the bat

2026-03-13 11:24:51 +00:00
parent f09e36e740
commit 8311556855
8 changed files with 85 additions and 32 deletions
@@ -1,25 +1,33 @@
+from pydantic import BaseModel
 from transformers import RobertaTokenizer, RobertaForSequenceClassification
 import torch
+from fastapi import FastAPI
+
+app = FastAPI()

 MODEL_PATH = "./roberta_classifier"

 tokenizer = RobertaTokenizer.from_pretrained(MODEL_PATH)
 model = RobertaForSequenceClassification.from_pretrained(MODEL_PATH)

-text2 = "High-profile political downplaying of COVID-19 (examples: President Trump saying 'it will go away' in March–August 2020)"
-text = "Multiple mirrored reuploads (2020–2023) put the clip on other channels with titles implying it was a genuine 1970s public information film."
+class EvalRequest(BaseModel):
+    answer: str

-inputs = tokenizer(
-    text,
-    return_tensors="pt",
-    truncation=True,
-    padding=True
-)
+@app.post("/evaluate")
+def evaluate_rob(req: EvalRequest):
+    inputs = tokenizer(
+        req.answer,
+        return_tensors="pt",
+        truncation=True,
+        padding=True
+    )

-model.eval()
+    model.eval()

-with torch.no_grad():
-    logits = model(**inputs).logits
+    with torch.no_grad():
+        logits = model(**inputs).logits

-probs = torch.softmax(logits, dim=1)
-print(probs)
+    probs = torch.softmax(logits, dim=1)
+    return {
+        "probabilities": probs.cpu().numpy().tolist()
+    }