update model card
Browse files
README.md
CHANGED
@@ -4,10 +4,9 @@ tags:
|
|
4 |
- russian
|
5 |
license: mit
|
6 |
widget:
|
7 |
-
- text: "translate ru
|
8 |
---
|
9 |
-
This
|
10 |
-
|
11 |
|
12 |
The model has been fine-tuned for several tasks:
|
13 |
* translation (opus100 dataset)
|
@@ -28,28 +27,32 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
|
|
28 |
|
29 |
def generate(text, **kwargs):
|
30 |
model.eval()
|
31 |
-
inputs = tokenizer(text, return_tensors='pt')
|
32 |
with torch.no_grad():
|
33 |
hypotheses = model.generate(**inputs, **kwargs)
|
34 |
return tokenizer.decode(hypotheses[0], skip_special_tokens=True)
|
35 |
|
36 |
-
print(generate('translate ru
|
37 |
-
#
|
38 |
|
39 |
-
print(generate("translate en
|
40 |
-
#
|
41 |
|
42 |
print(generate('dialog: user1>>: Hello', num_beams=2))
|
43 |
# Hi
|
44 |
|
45 |
print(generate('dialog: user1>>: Hello user2>>: Hi user1>>: Would you like to drink something?', num_beams=2))
|
46 |
-
# I
|
47 |
|
48 |
-
|
49 |
|
50 |
-
|
51 |
-
|
|
|
|
|
|
|
|
|
|
|
52 |
|
53 |
-
print(
|
54 |
-
# I'd like to have a cup of coffee.
|
55 |
```
|
|
|
4 |
- russian
|
5 |
license: mit
|
6 |
widget:
|
7 |
+
- text: "translate en-ru: I'm afraid that I won't finish the report on time."
|
8 |
---
|
9 |
+
This is the mt5-base model [google/mt5-base](https://huggingface.co/google/mt5-base) in which only the Russian and English tokens have been kept.
|
|
|
10 |
|
11 |
The model has been fine-tuned for several tasks:
|
12 |
* translation (opus100 dataset)
|
|
|
27 |
|
28 |
def generate(text, **kwargs):
|
29 |
model.eval()
|
30 |
+
inputs = tokenizer(text, return_tensors='pt').to(model.device)
|
31 |
with torch.no_grad():
|
32 |
hypotheses = model.generate(**inputs, **kwargs)
|
33 |
return tokenizer.decode(hypotheses[0], skip_special_tokens=True)
|
34 |
|
35 |
+
print(generate('translate ru-en: Я боюсь, что я не завершу доклад в ближайшее время.', num_beams=4,))
|
36 |
+
# I fear I'm not going to complete the report in the near future.
|
37 |
|
38 |
+
print(generate("translate en-ru: I'm afraid that I won't finish the report on time.", num_beams=4, max_length = 30))
|
39 |
+
# Я боюсь, что я не завершу доклад в ближайшее время.
|
40 |
|
41 |
print(generate('dialog: user1>>: Hello', num_beams=2))
|
42 |
# Hi
|
43 |
|
44 |
print(generate('dialog: user1>>: Hello user2>>: Hi user1>>: Would you like to drink something?', num_beams=2))
|
45 |
+
# I would like to drink a glass of wine.
|
46 |
|
47 |
+
from collections import deque
|
48 |
|
49 |
+
context =deque([], maxlen=6)
|
50 |
+
while True:
|
51 |
+
text = input()
|
52 |
+
text = 'user1>>: ' + text
|
53 |
+
context.append(text)
|
54 |
+
answ = generate('dialog: ' + ' '.join(context), num_beams=3, do_sample = True, temperature=1.5)
|
55 |
+
context.append('user2>>: ' + answ)
|
56 |
|
57 |
+
print('bot: ', answ)
|
|
|
58 |
```
|