vishaljoshi24 committed on
Commit
731cc49
·
1 Parent(s): 3488819

trying different LLM

Browse files
Files changed (1) hide show
  1. quickstart.py +1 -4
quickstart.py CHANGED
@@ -3,16 +3,13 @@ from trl import GRPOTrainer
3
  import os
4
 
5
  dataset = load_dataset("trl-lib/tldr", split="train")
6
- assert os.path.isfile("trl-lib/tldr")
7
- with open("trl-lib/tldr", "r") as f:
8
- pass
9
 
10
  # Dummy reward function: count the number of unique characters in the completions
11
  def reward_num_unique_chars(completions, **kwargs):
12
  return [len(set(c)) for c in completions]
13
 
14
  trainer = GRPOTrainer(
15
- model="Qwen/Qwen2-0.5B-Instruct",
16
  reward_funcs=reward_num_unique_chars,
17
  train_dataset=dataset,
18
  )
 
3
  import os
4
 
5
  dataset = load_dataset("trl-lib/tldr", split="train")
 
 
 
6
 
7
  # Dummy reward function: count the number of unique characters in the completions
8
  def reward_num_unique_chars(completions, **kwargs):
9
  return [len(set(c)) for c in completions]
10
 
11
  trainer = GRPOTrainer(
12
+ model="openai-community/gpt2",
13
  reward_funcs=reward_num_unique_chars,
14
  train_dataset=dataset,
15
  )