Update README.md
Browse files
README.md
CHANGED
|
@@ -65,11 +65,10 @@ metrics:
|
|
| 65 |
```python
|
| 66 |
from tokenizers import Tokenizer
|
| 67 |
|
| 68 |
-
# Загрузка токенизатора (если загружен с Hugging Face Hub)
|
| 69 |
tokenizer = Tokenizer.from_pretrained("Shu-vi/russian-bpe-tokenizer-16k")
|
| 70 |
|
| 71 |
# Пример
|
| 72 |
-
text = "В
|
| 73 |
encoded = tokenizer.encode(text)
|
| 74 |
|
| 75 |
print("Токены:", encoded.tokens)
|
|
|
|
| 65 |
```python
|
| 66 |
from tokenizers import Tokenizer
|
| 67 |
|
|
|
|
| 68 |
tokenizer = Tokenizer.from_pretrained("Shu-vi/russian-bpe-tokenizer-16k")
|
| 69 |
|
| 70 |
# Пример
|
| 71 |
+
text = "В Казани в 2024 прошёл БРИКС."
|
| 72 |
encoded = tokenizer.encode(text)
|
| 73 |
|
| 74 |
print("Токены:", encoded.tokens)
|