welcomecenterbot/nlp/toxycity_detector.py

13 lines
435 B
Python
Raw Normal View History

2024-09-26 10:07:01 +00:00
from transformers import BertTokenizer, BertForSequenceClassification
# Single checkpoint identifier shared by the tokenizer and the classifier,
# so the two can never drift apart.
_CHECKPOINT = 'SkolkovoInstitute/russian_toxicity_classifier'

# Both objects are created once, at import time, and reused by detector().
tokenizer = BertTokenizer.from_pretrained(_CHECKPOINT)
model = BertForSequenceClassification.from_pretrained(_CHECKPOINT)
def detector(text: str):
    """Run the toxicity classifier on *text* and return the model output.

    The text is encoded with the module-level ``tokenizer`` and passed
    through the module-level ``model``.

    Args:
        text: The message to classify.

    Returns:
        Whatever ``model(batch)`` returns. Previously this result was
        computed and then dropped, so the function always returned ``None``.
        NOTE(review): for a Hugging Face sequence-classification model this
        is presumably an output object exposing ``.logits`` -- confirm
        against the installed ``transformers`` version before relying on it.
    """
    # Encode the text into a tensor of token ids ('pt' = PyTorch tensors).
    batch = tokenizer.encode(text, return_tensors='pt')
    # Inference: hand the result back to the caller instead of discarding it.
    return model(batch)