LordPBA committed on
Commit
510dfae
·
verified ·
1 Parent(s): 5d22aca

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -18,22 +18,25 @@
18
  "lora_dropout": 0.05,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
- "modules_to_save": null,
 
 
 
22
  "peft_type": "LORA",
23
- "r": 8,
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "v_proj",
28
- "down_proj",
29
  "q_proj",
30
- "fc1",
31
  "up_proj",
32
- "fc2",
33
  "k_proj",
34
- "gate_proj",
35
- "out_proj",
36
- "o_proj"
37
  ],
38
  "task_type": "CAUSAL_LM",
39
  "trainable_token_indices": null,
 
18
  "lora_dropout": 0.05,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
+ "modules_to_save": [
22
+ "lm_head",
23
+ "embed_tokens"
24
+ ],
25
  "peft_type": "LORA",
26
+ "r": 16,
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
30
+ "fc2",
31
+ "out_proj",
32
  "q_proj",
33
+ "o_proj",
34
  "up_proj",
35
+ "v_proj",
36
  "k_proj",
37
+ "down_proj",
38
+ "fc1",
39
+ "gate_proj"
40
  ],
41
  "task_type": "CAUSAL_LM",
42
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:155a4bb01587d3038cee3c89befca01ea0fcef2b276ab8adb454d55379670ccd
3
- size 77119048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aabe8db5f15f6e15caa5a117bb409d41331f32f60f9eca2d5f8d42b7185bb01b
3
+ size 2839126480
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_pan_and_scan": null,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "image_mean": [
8
+ 0.5,
9
+ 0.5,
10
+ 0.5
11
+ ],
12
+ "image_processor_type": "Gemma3ImageProcessor",
13
+ "image_seq_length": 256,
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "pan_and_scan_max_num_crops": null,
20
+ "pan_and_scan_min_crop_size": null,
21
+ "pan_and_scan_min_ratio_to_activate": null,
22
+ "processor_class": "Gemma3Processor",
23
+ "resample": 2,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 896,
27
+ "width": 896
28
+ }
29
+ }
processor_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "image_seq_length": 256,
3
+ "processor_class": "Gemma3Processor"
4
+ }
runs/Jun10_08-45-28_7ea6724ade3d/events.out.tfevents.1749545132.7ea6724ade3d.5178.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70306e962a406f4172c546f1ebeafac5b676032a0258a621352c85bf45faa576
3
+ size 15217
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6ec2659e52e3d1aa82505357493940039828c81360d681090c3082f1878052c
3
- size 33384822
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ebf1915455f8237564395182c49e3c685cfe3533b3d50ec6d49ce65ec43c32e
3
+ size 33384723
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7401f90eb773cc9c00a06a08c17cc6d2a4d0ff8f0e33cb38f98a760c5a5ab57c
3
- size 6097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4482a7007a820b2911a5238e1c0c2bbfd2d189c47fe9f16b2f3d6244fe91f2fc
3
+ size 5688