Oysiyl committed on
Commit
7d5602f
·
verified ·
1 Parent(s): d9cca06

Oysiyl/colpali_ufo

Browse files
README.md CHANGED
@@ -15,6 +15,8 @@ should probably proofread and complete it, then remove this comment. -->
15
  # colpali_ufo
16
 
17
  This model is a fine-tuned version of [vidore/colpali-v1.2-hf](https://huggingface.co/vidore/colpali-v1.2-hf) on an unknown dataset.
 
 
18
 
19
  ## Model description
20
 
@@ -37,8 +39,6 @@ The following hyperparameters were used during training:
37
  - train_batch_size: 4
38
  - eval_batch_size: 8
39
  - seed: 42
40
- - gradient_accumulation_steps: 4
41
- - total_train_batch_size: 16
42
  - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - lr_scheduler_warmup_steps: 100
@@ -46,12 +46,20 @@ The following hyperparameters were used during training:
46
 
47
  ### Training results
48
 
 
 
 
 
 
 
 
 
49
 
50
 
51
  ### Framework versions
52
 
53
- - PEFT 0.11.1
54
- - Transformers 4.50.0.dev0
55
- - Pytorch 2.2.1+cu121
56
  - Datasets 3.3.1
57
  - Tokenizers 0.21.0
 
15
  # colpali_ufo
16
 
17
  This model is a fine-tuned version of [vidore/colpali-v1.2-hf](https://huggingface.co/vidore/colpali-v1.2-hf) on an unknown dataset.
18
+ It achieves the following results on the evaluation set:
19
+ - Loss: 0.1795
20
 
21
  ## Model description
22
 
 
39
  - train_batch_size: 4
40
  - eval_batch_size: 8
41
  - seed: 42
 
 
42
  - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - lr_scheduler_warmup_steps: 100
 
46
 
47
  ### Training results
48
 
49
+ | Training Loss | Epoch | Step | Validation Loss |
50
+ |:-------------:|:------:|:----:|:---------------:|
51
+ | 0.1276 | 0.1636 | 80 | 0.1831 |
52
+ | 0.0923 | 0.3272 | 160 | 0.1767 |
53
+ | 0.1029 | 0.4908 | 240 | 0.1730 |
54
+ | 0.093 | 0.6544 | 320 | 0.1749 |
55
+ | 0.0822 | 0.8180 | 400 | 0.1760 |
56
+ | 0.0965 | 0.9816 | 480 | 0.1795 |
57
 
58
 
59
  ### Framework versions
60
 
61
+ - PEFT 0.14.0
62
+ - Transformers 4.49.0
63
+ - Pytorch 2.3.0+cu121
64
  - Datasets 3.3.1
65
  - Tokenizers 0.21.0
adapter_config.json CHANGED
@@ -6,6 +6,8 @@
6
  },
7
  "base_model_name_or_path": "vidore/colpali-v1.2-hf",
8
  "bias": "none",
 
 
9
  "fan_in_fan_out": false,
10
  "inference_mode": true,
11
  "init_lora_weights": "gaussian",
@@ -14,22 +16,18 @@
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
  "lora_alpha": 8,
17
- "lora_dropout": 0.1,
 
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": null,
21
  "peft_type": "LORA",
22
- "r": 8,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
  "q_proj",
27
- "o_proj",
28
- "down_proj",
29
- "k_proj",
30
- "up_proj",
31
- "gate_proj",
32
- "v_proj"
33
  ],
34
  "task_type": null,
35
  "use_dora": false,
 
6
  },
7
  "base_model_name_or_path": "vidore/colpali-v1.2-hf",
8
  "bias": "none",
9
+ "eva_config": null,
10
+ "exclude_modules": null,
11
  "fan_in_fan_out": false,
12
  "inference_mode": true,
13
  "init_lora_weights": "gaussian",
 
16
  "layers_to_transform": null,
17
  "loftq_config": {},
18
  "lora_alpha": 8,
19
+ "lora_bias": false,
20
+ "lora_dropout": 0.2,
21
  "megatron_config": null,
22
  "megatron_core": "megatron.core",
23
  "modules_to_save": null,
24
  "peft_type": "LORA",
25
+ "r": 4,
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
  "q_proj",
30
+ "k_proj"
 
 
 
 
 
31
  ],
32
  "task_type": null,
33
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59447f437ad62db0bf16e19eeb9c939a2c7de0edf04cd4c046dc38810cbb53f7
3
- size 45260040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64a40b36bb25d4583cf6e233b22d028ca0f692ee7a00f5302fc2cc2d9f791d6b
3
+ size 3862296
runs/Apr03_16-43-10_ip-10-192-12-167/events.out.tfevents.1743698605.ip-10-192-12-167.4420.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a692d3e823c0a7c2215c1a8efa579f077af0c890cd337eb2bf4ed35c240b5007
3
+ size 6249
runs/Apr03_16-44-42_ip-10-192-12-167/events.out.tfevents.1743698689.ip-10-192-12-167.4420.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d2fc9b9226ff5d933738ec931db7201a483cc66ee498f2cd9e9f4787fc8654c
3
+ size 6249
runs/Apr03_16-45-38_ip-10-192-12-167/events.out.tfevents.1743698746.ip-10-192-12-167.4420.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e13775dcbef11d7278e487fe3a89cfac8cccbdbac842d0298f3e4f68b548d4b
3
+ size 6456
runs/Apr03_16-48-15_ip-10-192-12-167/events.out.tfevents.1743698901.ip-10-192-12-167.4420.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69625b67d8f81cbfd8270559caae7305461ee31ac9ea3b916f2d02425b871c54
3
+ size 6249
runs/Apr03_17-10-22_ip-10-192-12-167/events.out.tfevents.1743700241.ip-10-192-12-167.50177.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f87f1dd2078f8caa2ca1297ec8cf926d56d776a25f972f33549f8d8b91174345
3
+ size 5974
runs/Apr03_17-12-49_ip-10-192-12-167/events.out.tfevents.1743700381.ip-10-192-12-167.50177.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a18b7897f3a57a14dad55ea05c1a925869bac4606695e3200a5dcd5b34aea004
3
+ size 5767
runs/Apr03_17-15-00_ip-10-192-12-167/events.out.tfevents.1743700506.ip-10-192-12-167.57304.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e19c00710fa8cb63398402635bfe21f339323053695ed6706750a1c02943ac0a
3
+ size 5767
runs/Apr03_17-16-25_ip-10-192-12-167/events.out.tfevents.1743700593.ip-10-192-12-167.60005.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a9183640ba45f4f84ba13066b1895d18e96ac0e4dd4036c26e2008e81b69ba
3
+ size 5974
runs/Apr03_17-20-11_ip-10-192-12-167/events.out.tfevents.1743700818.ip-10-192-12-167.60005.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f762294890d7f33279804fa33eff927caeca1918951ef999d648be323a296ca
3
+ size 5974
runs/Apr03_17-23-40_ip-10-192-12-167/events.out.tfevents.1743701028.ip-10-192-12-167.67022.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:270439c8a8aa97e47f144d106447ad609328c11d98f51408d383d11d6a8fa922
3
+ size 9004
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94ba8f4bef1143d207b868f001cd1b70199fcd8e795559d3865f2c34324bf2bb
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74c7fbb4a3cdf633646919fe0e4f78e18c53b67c007308a611987ef579946d96
3
  size 5304