SophieA17 committed on
Commit
f225fc7
·
verified ·
1 Parent(s): edd20a2

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +13 -3
README.md CHANGED
@@ -1,4 +1,14 @@
1
- Sophie0-SFT
 
 
 
 
 
 
 
 
 
 
2
 
3
  ### Introduction
4
 
@@ -18,8 +28,8 @@ import torch
18
 
19
  from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
20
 
21
- model: AutoModelForCausalLM = AutoModelForCausalLM.from_pretrained("SophieA17/Sophie0-SFT", trust_remote_code=True)
22
- tokenizer: AutoTokenizer = AutoTokenizer.from_pretrained("SophieA17/Sophie0-SFT", trust_remote_code=True)
23
 
24
  model = model.to(device="cuda:0", dtype=torch.bfloat16)
25
  inputs = [
 
1
+ ---
2
+ license: apache-2.0
3
+ datasets:
4
+ - K-and-K/knights-and-knaves
5
+ language:
6
+ - en
7
+ - zh
8
+ base_model:
9
+ - SophieA17/Sophie0-Reasoning-SFT
10
+ ---
11
+ Sophie0-Reasoning-GRPO
12
 
13
  ### Introduction
14
 
 
28
 
29
  from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
30
 
31
+ model: AutoModelForCausalLM = AutoModelForCausalLM.from_pretrained("SophieA17/Sophie0-Reasoning-GRPO", trust_remote_code=True)
32
+ tokenizer: AutoTokenizer = AutoTokenizer.from_pretrained("SophieA17/Sophie0-Reasoning-GRPO", trust_remote_code=True)
33
 
34
  model = model.to(device="cuda:0", dtype=torch.bfloat16)
35
  inputs = [