Add ROBERTA classifier ranking PoC, with 77pc off the bat

This commit is contained in:
William Jeynes
2026-03-13 11:24:51 +00:00
parent f09e36e740
commit 8311556855
8 changed files with 85 additions and 32 deletions
+21 -13
View File
@@ -1,25 +1,33 @@
from pydantic import BaseModel
from transformers import RobertaTokenizer, RobertaForSequenceClassification
import torch
from fastapi import FastAPI
app = FastAPI()
MODEL_PATH = "./roberta_classifier"
tokenizer = RobertaTokenizer.from_pretrained(MODEL_PATH)
model = RobertaForSequenceClassification.from_pretrained(MODEL_PATH)
text2 = "High-profile political downplaying of COVID-19 (examples: President Trump saying 'it will go away' in MarchAugust 2020)"
text = "Multiple mirrored reuploads (20202023) put the clip on other channels with titles implying it was a genuine 1970s public information film."
class EvalRequest(BaseModel):
answer: str
inputs = tokenizer(
text,
return_tensors="pt",
truncation=True,
padding=True
)
@app.post("/evaluate")
def evaluate_rob(req: EvalRequest):
inputs = tokenizer(
req.answer,
return_tensors="pt",
truncation=True,
padding=True
)
model.eval()
model.eval()
with torch.no_grad():
logits = model(**inputs).logits
with torch.no_grad():
logits = model(**inputs).logits
probs = torch.softmax(logits, dim=1)
print(probs)
probs = torch.softmax(logits, dim=1)
return {
"probabilities": probs.cpu().numpy().tolist()
}