This commit is contained in:
2024-09-26 13:07:01 +03:00
parent 1c8bc26c64
commit 0fa336978f
4 changed files with 42 additions and 18 deletions

13
nlp/toxycity_detector.py Normal file
View File

@@ -0,0 +1,13 @@
from transformers import BertTokenizer, BertForSequenceClassification
# Both the tokenizer and the classifier weights are loaded from the same
# pretrained checkpoint, so its identifier is kept in a single place.
_PRETRAINED_NAME = 'SkolkovoInstitute/russian_toxicity_classifier'

# Loaded once at import time and shared by every call in this module.
tokenizer = BertTokenizer.from_pretrained(_PRETRAINED_NAME)
model = BertForSequenceClassification.from_pretrained(_PRETRAINED_NAME)
def detector(text):
    """Run the toxicity classifier on ``text`` and return the model output.

    Args:
        text: The text to classify; it is passed to ``tokenizer.encode``.

    Returns:
        The value produced by ``model(batch)`` for the encoded text.
        Previously this value was computed and then dropped, so the
        function always returned ``None``.
        NOTE(review): presumably the output exposes the classification
        logits -- confirm against the transformers documentation before
        indexing into it.
    """
    # Prepare the input: encode the text, requesting PyTorch tensors ('pt').
    batch = tokenizer.encode(text, return_tensors='pt')
    # Inference: hand the result back to the caller instead of discarding it.
    return model(batch)