EleanorZzz committed on
Commit
088de3c
·
verified ·
1 Parent(s): 49a9f55

End of training

Browse files
Files changed (5) hide show
  1. README.md +1 -1
  2. all_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +32 -32
  5. training_loss.png +0 -0
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # persuasion_simulation_persona_sft_w_promp_3epochs
18
 
19
- This model is a fine-tuned version of [meta-llama/Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct) on an unknown dataset.
20
 
21
  ## Model description
22
 
 
16
 
17
  # persuasion_simulation_persona_sft_w_promp_3epochs
18
 
19
+ This model is a fine-tuned version of [meta-llama/Llama-3.1-8B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct) on the persuasion_simulation dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.946236559139785,
3
- "total_flos": 3904168919040.0,
4
- "train_loss": 0.8688372978265735,
5
- "train_runtime": 1181.3244,
6
- "train_samples_per_second": 1.877,
7
- "train_steps_per_second": 0.117
8
  }
 
1
  {
2
  "epoch": 2.946236559139785,
3
+ "total_flos": 3976309309440.0,
4
+ "train_loss": 0.8567031431889188,
5
+ "train_runtime": 1140.8622,
6
+ "train_samples_per_second": 1.943,
7
+ "train_steps_per_second": 0.121
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.946236559139785,
3
- "total_flos": 3904168919040.0,
4
- "train_loss": 0.8688372978265735,
5
- "train_runtime": 1181.3244,
6
- "train_samples_per_second": 1.877,
7
- "train_steps_per_second": 0.117
8
  }
 
1
  {
2
  "epoch": 2.946236559139785,
3
+ "total_flos": 3976309309440.0,
4
+ "train_loss": 0.8567031431889188,
5
+ "train_runtime": 1140.8622,
6
+ "train_samples_per_second": 1.943,
7
+ "train_steps_per_second": 0.121
8
  }
trainer_state.json CHANGED
@@ -11,103 +11,103 @@
11
  "log_history": [
12
  {
13
  "epoch": 0.21505376344086022,
14
- "grad_norm": 7.996015926817187,
15
  "learning_rate": 7.1428571428571436e-06,
16
- "loss": 2.2981,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.43010752688172044,
21
- "grad_norm": 2.962707682143447,
22
  "learning_rate": 9.942341621640558e-06,
23
- "loss": 1.0994,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.6451612903225806,
28
- "grad_norm": 1.7445658767729006,
29
  "learning_rate": 9.594789058101154e-06,
30
- "loss": 0.9707,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.8602150537634409,
35
- "grad_norm": 1.5507007800350687,
36
  "learning_rate": 8.953878684688492e-06,
37
- "loss": 0.9301,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 1.064516129032258,
42
- "grad_norm": 1.7262461771482085,
43
  "learning_rate": 8.060529912738316e-06,
44
- "loss": 0.8727,
45
  "step": 50
46
  },
47
  {
48
  "epoch": 1.2795698924731183,
49
- "grad_norm": 1.677061241367903,
50
  "learning_rate": 6.971779275566593e-06,
51
- "loss": 0.7903,
52
  "step": 60
53
  },
54
  {
55
  "epoch": 1.4946236559139785,
56
- "grad_norm": 1.6964854513828154,
57
  "learning_rate": 5.757138887522884e-06,
58
- "loss": 0.7514,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.7096774193548387,
63
- "grad_norm": 1.7463783101137778,
64
  "learning_rate": 4.49415839006284e-06,
65
- "loss": 0.7546,
66
  "step": 80
67
  },
68
  {
69
  "epoch": 1.924731182795699,
70
- "grad_norm": 1.79920542020065,
71
  "learning_rate": 3.2634737357758994e-06,
72
- "loss": 0.7558,
73
  "step": 90
74
  },
75
  {
76
  "epoch": 2.129032258064516,
77
- "grad_norm": 3.698924921571074,
78
  "learning_rate": 2.1436589245260375e-06,
79
- "loss": 0.6577,
80
  "step": 100
81
  },
82
  {
83
  "epoch": 2.3440860215053765,
84
- "grad_norm": 1.9212954432010707,
85
  "learning_rate": 1.2062093865360458e-06,
86
- "loss": 0.5443,
87
  "step": 110
88
  },
89
  {
90
  "epoch": 2.5591397849462365,
91
- "grad_norm": 1.7906293486232936,
92
  "learning_rate": 5.109773021462921e-07,
93
- "loss": 0.5612,
94
  "step": 120
95
  },
96
  {
97
  "epoch": 2.774193548387097,
98
- "grad_norm": 1.8644011572770092,
99
  "learning_rate": 1.0235029373752758e-07,
100
- "loss": 0.5485,
101
  "step": 130
102
  },
103
  {
104
  "epoch": 2.946236559139785,
105
  "step": 138,
106
- "total_flos": 3904168919040.0,
107
- "train_loss": 0.8688372978265735,
108
- "train_runtime": 1181.3244,
109
- "train_samples_per_second": 1.877,
110
- "train_steps_per_second": 0.117
111
  }
112
  ],
113
  "logging_steps": 10,
@@ -127,7 +127,7 @@
127
  "attributes": {}
128
  }
129
  },
130
- "total_flos": 3904168919040.0,
131
  "train_batch_size": 1,
132
  "trial_name": null,
133
  "trial_params": null
 
11
  "log_history": [
12
  {
13
  "epoch": 0.21505376344086022,
14
+ "grad_norm": 8.46070883603428,
15
  "learning_rate": 7.1428571428571436e-06,
16
+ "loss": 2.281,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.43010752688172044,
21
+ "grad_norm": 2.013915203610999,
22
  "learning_rate": 9.942341621640558e-06,
23
+ "loss": 1.0733,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.6451612903225806,
28
+ "grad_norm": 1.7956971723377748,
29
  "learning_rate": 9.594789058101154e-06,
30
+ "loss": 0.9705,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.8602150537634409,
35
+ "grad_norm": 1.6961156545645073,
36
  "learning_rate": 8.953878684688492e-06,
37
+ "loss": 0.9142,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 1.064516129032258,
42
+ "grad_norm": 1.8314800502805586,
43
  "learning_rate": 8.060529912738316e-06,
44
+ "loss": 0.8739,
45
  "step": 50
46
  },
47
  {
48
  "epoch": 1.2795698924731183,
49
+ "grad_norm": 1.6076365651648326,
50
  "learning_rate": 6.971779275566593e-06,
51
+ "loss": 0.7693,
52
  "step": 60
53
  },
54
  {
55
  "epoch": 1.4946236559139785,
56
+ "grad_norm": 1.8941368042951945,
57
  "learning_rate": 5.757138887522884e-06,
58
+ "loss": 0.7425,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.7096774193548387,
63
+ "grad_norm": 1.6194897434909907,
64
  "learning_rate": 4.49415839006284e-06,
65
+ "loss": 0.7411,
66
  "step": 80
67
  },
68
  {
69
  "epoch": 1.924731182795699,
70
+ "grad_norm": 1.7633519262799326,
71
  "learning_rate": 3.2634737357758994e-06,
72
+ "loss": 0.7342,
73
  "step": 90
74
  },
75
  {
76
  "epoch": 2.129032258064516,
77
+ "grad_norm": 4.149990534677345,
78
  "learning_rate": 2.1436589245260375e-06,
79
+ "loss": 0.6493,
80
  "step": 100
81
  },
82
  {
83
  "epoch": 2.3440860215053765,
84
+ "grad_norm": 1.9290115229564264,
85
  "learning_rate": 1.2062093865360458e-06,
86
+ "loss": 0.5389,
87
  "step": 110
88
  },
89
  {
90
  "epoch": 2.5591397849462365,
91
+ "grad_norm": 1.8069878203895482,
92
  "learning_rate": 5.109773021462921e-07,
93
+ "loss": 0.536,
94
  "step": 120
95
  },
96
  {
97
  "epoch": 2.774193548387097,
98
+ "grad_norm": 1.8623419402988957,
99
  "learning_rate": 1.0235029373752758e-07,
100
+ "loss": 0.561,
101
  "step": 130
102
  },
103
  {
104
  "epoch": 2.946236559139785,
105
  "step": 138,
106
+ "total_flos": 3976309309440.0,
107
+ "train_loss": 0.8567031431889188,
108
+ "train_runtime": 1140.8622,
109
+ "train_samples_per_second": 1.943,
110
+ "train_steps_per_second": 0.121
111
  }
112
  ],
113
  "logging_steps": 10,
 
127
  "attributes": {}
128
  }
129
  },
130
+ "total_flos": 3976309309440.0,
131
  "train_batch_size": 1,
132
  "trial_name": null,
133
  "trial_params": null
training_loss.png CHANGED