artemnech committed on
Commit
e7b9972
·
1 Parent(s): 13523cb

update model card

Browse files
Files changed (1) hide show
  1. README.md +17 -14
README.md CHANGED
@@ -4,10 +4,9 @@ tags:
4
  - russian
5
  license: mit
6
  widget:
7
- - text: "translate ru to en: Интересный момент. Модель не видела русских диалогов, но может их понимать"
8
  ---
9
- This pruned model of mt5-base [google/mt5-base](https://huggingface.co/google/mt5-base) with only some Rusian and English embeddings left.
10
-
11
 
12
  The model has been fine-tuned for several tasks:
13
  * translation (opus100 dataset)
@@ -28,28 +27,32 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
28
 
29
  def generate(text, **kwargs):
30
  model.eval()
31
- inputs = tokenizer(text, return_tensors='pt')
32
  with torch.no_grad():
33
  hypotheses = model.generate(**inputs, **kwargs)
34
  return tokenizer.decode(hypotheses[0], skip_special_tokens=True)
35
 
36
- print(generate('translate ru to en: Интересный момент. Модель не видела русских диалогов, но может их понимать', num_beams=4,))
37
- # The Model didn't see Russian dialogues, but can understand them.
38
 
39
- print(generate("translate en to ru: The Model didn't see Russian dialogues, but can understand them.", num_beams=4,))
40
- # Модель не видела русских диалога, но может понимать их.
41
 
42
  print(generate('dialog: user1>>: Hello', num_beams=2))
43
  # Hi
44
 
45
  print(generate('dialog: user1>>: Hello user2>>: Hi user1>>: Would you like to drink something?', num_beams=2))
46
- # I'd like to drink a cup of coffee.
47
 
48
- #An interesting point. The model has not seen Russian dialogues, but can understand them
49
 
50
- print(generate('dialog: user1>>: Привет'))
51
- # Hi
 
 
 
 
 
52
 
53
- print(generate('dialog: user1>>: Привет user2>>: Hi user1>>: Хочешь выпить что-нибудь?', num_beams=2))
54
- # I'd like to have a cup of coffee.
55
  ```
 
4
  - russian
5
  license: mit
6
  widget:
7
+ - text: "translate en-ru: I'm afraid that I won't finish the report on time."
8
  ---
9
+ This is the mt5-base model [google/mt5-base](https://huggingface.co/google/mt5-base) in which only the Russian and English tokens are left.
 
10
 
11
  The model has been fine-tuned for several tasks:
12
  * translation (opus100 dataset)
 
27
 
28
  def generate(text, **kwargs):
29
  model.eval()
30
+ inputs = tokenizer(text, return_tensors='pt').to(model.device)
31
  with torch.no_grad():
32
  hypotheses = model.generate(**inputs, **kwargs)
33
  return tokenizer.decode(hypotheses[0], skip_special_tokens=True)
34
 
35
+ print(generate('translate ru-en: Я боюсь, что я не завершу доклад в ближайшее время.', num_beams=4,))
36
+ # I fear I'm not going to complete the report in the near future.
37
 
38
+ print(generate("translate en-ru: I'm afraid that I won't finish the report on time.", num_beams=4, max_length = 30))
39
+ # Я боюсь, что я не завершу доклад в ближайшее время.
40
 
41
  print(generate('dialog: user1>>: Hello', num_beams=2))
42
  # Hi
43
 
44
  print(generate('dialog: user1>>: Hello user2>>: Hi user1>>: Would you like to drink something?', num_beams=2))
45
+ # I would like to drink a glass of wine.
46
 
47
+ from collections import deque
48
 
49
+ context =deque([], maxlen=6)
50
+ while True:
51
+ text = input()
52
+ text = 'user1>>: ' + text
53
+ context.append(text)
54
+ answ = generate('dialog: ' + ' '.join(context), num_beams=3, do_sample = True, temperature=1.5)
55
+ context.append('user2>>: ' + answ)
56
 
57
+ print('bot: ', answ)
 
58
  ```