Update README.md
Browse files
README.md
CHANGED
|
@@ -28,8 +28,8 @@ The metrics obtained from the test dataset are as follows
|
|
| 28 |
from transformers import BertTokenizer, BertForSequenceClassification
|
| 29 |
|
| 30 |
# load tokenizer and model weights
|
| 31 |
-
tokenizer = BertTokenizer.from_pretrained('
|
| 32 |
-
model = BertForSequenceClassification.from_pretrained('
|
| 33 |
|
| 34 |
# prepare the input
|
| 35 |
batch = tokenizer.encode('ты супер', return_tensors='pt')
|
|
@@ -38,6 +38,15 @@ batch = tokenizer.encode('ты супер', return_tensors='pt')
|
|
| 38 |
model(batch)
|
| 39 |
```
|
| 40 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
|
| 42 |
## Licensing Information
|
| 43 |
|
|
|
|
| 28 |
from transformers import BertTokenizer, BertForSequenceClassification
|
| 29 |
|
| 30 |
# load tokenizer and model weights
|
| 31 |
+
tokenizer = BertTokenizer.from_pretrained('s-nlp/russian_toxicity_classifier')
|
| 32 |
+
model = BertForSequenceClassification.from_pretrained('s-nlp/russian_toxicity_classifier')
|
| 33 |
|
| 34 |
# prepare the input
|
| 35 |
batch = tokenizer.encode('ты супер', return_tensors='pt')
|
|
|
|
| 38 |
model(batch)
|
| 39 |
```
|
| 40 |
|
| 41 |
+
## Citation
|
| 42 |
+
|
| 43 |
+
```
|
| 44 |
+
@article{dementieva2022russe,
|
| 45 |
+
title={RUSSE-2022: Findings of the First Russian Detoxification Shared Task Based on Parallel Corpora},
|
| 46 |
+
author={Dementieva, Daryna and Logacheva, Varvara and Nikishina, Irina and Fenogenova, Alena and Dale, David and Krotova, Irina and Semenov, Nikita and Shavrina, Tatiana and Panchenko, Alexander}
|
| 47 |
+
}
|
| 48 |
+
```
|
| 49 |
+
|
| 50 |
|
| 51 |
## Licensing Information
|
| 52 |
|