Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

checkpoint-1000/README.md +33 -33
checkpoint-1000/model.safetensors +1 -1
checkpoint-1000/optimizer.pt +1 -1
checkpoint-1000/rng_state.pth +1 -1
checkpoint-1000/scheduler.pt +1 -1
checkpoint-1000/trainer_state.json +32 -32
checkpoint-1000/training_args.bin +1 -1

checkpoint-1000/README.md CHANGED Viewed

@@ -13,31 +13,31 @@ tags:
 - dataset_size:74247
 - loss:AnglELoss
 widget:
-- source_sentence: hand of fatima decanter
-  sentences:
-  - matte concealer
-  - car refresher spray
-  - bread
-- source_sentence: intensive antiwrinkle face cream
   sentences:
   - bread
-  - bread
   - car refresher spray
-- source_sentence: aromatic coffee capsules
   sentences:
-  - bread
-  - car refresher spray
-  - bread
-- source_sentence: side fringe jacket
   sentences:
-  - car refresher spray
-  - car refresher spray
   - home scent
-- source_sentence: pastelcolored cookies
   sentences:
-  - matte concealer
-  - rice
-  - bisk
 ---
 # all-MiniLM-L6-v6-pair_score
@@ -90,9 +90,9 @@ from sentence_transformers import SentenceTransformer
 model = SentenceTransformer("sentence_transformers_model_id")
 # Run inference
 sentences = [
-    'pastelcolored cookies',
-    'bisk',
-    'rice',
 ]
 embeddings = model.encode(sentences)
 print(embeddings.shape)
@@ -149,7 +149,7 @@ You can finetune this model on your own dataset.
 - `per_device_train_batch_size`: 128
 - `per_device_eval_batch_size`: 128
 - `learning_rate`: 2e-05
-- `num_train_epochs`: 2
 - `warmup_ratio`: 0.1
 - `fp16`: True
@@ -173,7 +173,7 @@ You can finetune this model on your own dataset.
 - `adam_beta2`: 0.999
 - `adam_epsilon`: 1e-08
 - `max_grad_norm`: 1.0
-- `num_train_epochs`: 2
 - `max_steps`: -1
 - `lr_scheduler_type`: linear
 - `lr_scheduler_kwargs`: {}
@@ -274,16 +274,16 @@ You can finetune this model on your own dataset.
 ### Training Logs
 | Epoch  | Step | Training Loss |
 |:------:|:----:|:-------------:|
-| 0.1721 | 100  | 8.9697        |
-| 0.3442 | 200  | 2.6119        |
-| 0.5164 | 300  | 0.9351        |
-| 0.6885 | 400  | 0.7049        |
-| 0.8606 | 500  | 0.394         |
-| 1.0327 | 600  | 0.6792        |
-| 1.2048 | 700  | 0.715         |
-| 1.3769 | 800  | 0.5655        |
-| 1.5491 | 900  | 0.5354        |
-| 1.7212 | 1000 | 0.6299        |
 ### Framework Versions

 - dataset_size:74247
 - loss:AnglELoss
 widget:
+- source_sentence: paste
   sentences:
   - bread
   - car refresher spray
+  - hot drinks mug
+- source_sentence: shoulder strap accessory for bags
   sentences:
+  - home scent
+  - ball
+  - one outer pocket cross bag
+- source_sentence: deep fried mozzarella sticks
   sentences:
+  - one outer pocket cross bag
+  - insect killer
+  - stir fry vegetables bowl
+- source_sentence: metal flower set tableaus
+  sentences:
+  - home scent
   - home scent
+  - hygiene
+- source_sentence: basic choker
   sentences:
+  - hygiene
+  - unisex sweatshirt
+  - unisex sweatshirt
 ---
 # all-MiniLM-L6-v6-pair_score
 model = SentenceTransformer("sentence_transformers_model_id")
 # Run inference
 sentences = [
+    'basic choker',
+    'unisex sweatshirt',
+    'unisex sweatshirt',
 ]
 embeddings = model.encode(sentences)
 print(embeddings.shape)
 - `per_device_train_batch_size`: 128
 - `per_device_eval_batch_size`: 128
 - `learning_rate`: 2e-05
+- `num_train_epochs`: 15
 - `warmup_ratio`: 0.1
 - `fp16`: True
 - `adam_beta2`: 0.999
 - `adam_epsilon`: 1e-08
 - `max_grad_norm`: 1.0
+- `num_train_epochs`: 15
 - `max_steps`: -1
 - `lr_scheduler_type`: linear
 - `lr_scheduler_kwargs`: {}
 ### Training Logs
 | Epoch  | Step | Training Loss |
 |:------:|:----:|:-------------:|
+| 0.1721 | 100  | 10.8697       |
+| 0.3442 | 200  | 9.1125        |
+| 0.5164 | 300  | 6.8873        |
+| 0.6885 | 400  | 3.1124        |
+| 0.8606 | 500  | 1.0882        |
+| 1.0327 | 600  | 0.869         |
+| 1.2048 | 700  | 0.6952        |
+| 1.3769 | 800  | 0.5522        |
+| 1.5491 | 900  | 0.5184        |
+| 1.7212 | 1000 | 0.3996        |
 ### Framework Versions

checkpoint-1000/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea4b264b62f1f3dfc8756de31cee45d4ac202c2713bed99f962a11e9087a35e3
 size 90864192

 version https://git-lfs.github.com/spec/v1
+oid sha256:73e5bceeeb8bd41387e7ebe4b365333a81a52ae62160e1fa7e0a03dfc37ba0e3
 size 90864192

checkpoint-1000/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a233a843b3a76d2b79bcb84775a6f946f363ec4c1cb82d0a2a2fb5336725f64
 size 180607738

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb34b407b9c534b08406d0b763420188b77a8c5ae59b33faef820746c1533433
 size 180607738

checkpoint-1000/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9b4e3b023cf818a92a7faebf3bfd08e4bf4825bcbd3669f92d1f25d60a14eef
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:b320d6c3b1cd02590a033bf1d85ee904f31b839ca127ff50b770410fdc09a9e7
 size 14244

checkpoint-1000/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75a7920109b4e336482779ea4d3a308920045e01ee2548b630deb1a47f9a0f7a
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:15dfa03098fd205b4cc1a5079e6c0db8a1fc9977130aed17d77d33eb6d658add
 size 1064

checkpoint-1000/trainer_state.json CHANGED Viewed

@@ -10,79 +10,79 @@
   "log_history": [
     {
       "epoch": 0.1721170395869191,
-      "grad_norm": 85.81483459472656,
-      "learning_rate": 1.6581196581196585e-05,
-      "loss": 8.9697,
       "step": 100
     },
     {
       "epoch": 0.3442340791738382,
-      "grad_norm": 12.870137214660645,
-      "learning_rate": 1.8468899521531104e-05,
-      "loss": 2.6119,
       "step": 200
     },
     {
       "epoch": 0.5163511187607573,
-      "grad_norm": 6.086756706237793,
-      "learning_rate": 1.657416267942584e-05,
-      "loss": 0.9351,
       "step": 300
     },
     {
       "epoch": 0.6884681583476764,
-      "grad_norm": 4.553544998168945,
-      "learning_rate": 1.4660287081339715e-05,
-      "loss": 0.7049,
       "step": 400
     },
     {
       "epoch": 0.8605851979345955,
-      "grad_norm": 150.66317749023438,
-      "learning_rate": 1.274641148325359e-05,
-      "loss": 0.394,
       "step": 500
     },
     {
       "epoch": 1.0327022375215147,
-      "grad_norm": 2.234631061553955,
-      "learning_rate": 1.0832535885167466e-05,
-      "loss": 0.6792,
       "step": 600
     },
     {
       "epoch": 1.2048192771084336,
-      "grad_norm": 3.470113515853882,
-      "learning_rate": 8.91866028708134e-06,
-      "loss": 0.715,
       "step": 700
     },
     {
       "epoch": 1.3769363166953528,
-      "grad_norm": 2.741096019744873,
-      "learning_rate": 7.004784688995215e-06,
-      "loss": 0.5655,
       "step": 800
     },
     {
       "epoch": 1.549053356282272,
-      "grad_norm": 1.5165340900421143,
-      "learning_rate": 5.090909090909091e-06,
-      "loss": 0.5354,
       "step": 900
     },
     {
       "epoch": 1.721170395869191,
-      "grad_norm": 1.2075858116149902,
-      "learning_rate": 3.177033492822967e-06,
-      "loss": 0.6299,
       "step": 1000
     }
   ],
   "logging_steps": 100,
-  "max_steps": 1162,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 2,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {

   "log_history": [
     {
       "epoch": 0.1721170395869191,
+      "grad_norm": 134.16664123535156,
+      "learning_rate": 2.224770642201835e-06,
+      "loss": 10.8697,
       "step": 100
     },
     {
       "epoch": 0.3442340791738382,
+      "grad_norm": 69.6041259765625,
+      "learning_rate": 4.5183486238532115e-06,
+      "loss": 9.1125,
       "step": 200
     },
     {
       "epoch": 0.5163511187607573,
+      "grad_norm": 103.4394760131836,
+      "learning_rate": 6.8119266055045875e-06,
+      "loss": 6.8873,
       "step": 300
     },
     {
       "epoch": 0.6884681583476764,
+      "grad_norm": 32.237342834472656,
+      "learning_rate": 9.08256880733945e-06,
+      "loss": 3.1124,
       "step": 400
     },
     {
       "epoch": 0.8605851979345955,
+      "grad_norm": 13.523033142089844,
+      "learning_rate": 1.1376146788990828e-05,
+      "loss": 1.0882,
       "step": 500
     },
     {
       "epoch": 1.0327022375215147,
+      "grad_norm": 56.13002395629883,
+      "learning_rate": 1.3669724770642203e-05,
+      "loss": 0.869,
       "step": 600
     },
     {
       "epoch": 1.2048192771084336,
+      "grad_norm": 4.41276741027832,
+      "learning_rate": 1.5963302752293578e-05,
+      "loss": 0.6952,
       "step": 700
     },
     {
       "epoch": 1.3769363166953528,
+      "grad_norm": 1.8771318197250366,
+      "learning_rate": 1.8256880733944955e-05,
+      "loss": 0.5522,
       "step": 800
     },
     {
       "epoch": 1.549053356282272,
+      "grad_norm": 5.131401062011719,
+      "learning_rate": 1.9938798928981258e-05,
+      "loss": 0.5184,
       "step": 900
     },
     {
       "epoch": 1.721170395869191,
+      "grad_norm": 3.2520999908447266,
+      "learning_rate": 1.9683794466403164e-05,
+      "loss": 0.3996,
       "step": 1000
     }
   ],
   "logging_steps": 100,
+  "max_steps": 8715,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {

checkpoint-1000/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:57644da3fa51947d8e4d49382ff60305072c84a28b92b508a49ba8ad874ddd0f
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:ac8296029d0c3febd6057eb740de9cfe0b929fa172fd988f31151dfac15c657c
 size 5496