toilaluan committed on
Commit
67e3bc5
·
verified ·
1 Parent(s): 72f1cf4

Training in progress, step 2500

Browse files
adapter_config.json CHANGED
@@ -1 +1,41 @@
1
- {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "unsloth/Qwen2.5-Math-7B-Instruct", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["o_proj", "k_proj", "up_proj", "query_key_value", "q_proj", "out_proj", "gate_proj", "down_proj", "v_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/Qwen2.5-Math-7B-Instruct",
5
+ "bias": "none",
6
+ "corda_config": null,
7
+ "eva_config": null,
8
+ "exclude_modules": null,
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": true,
12
+ "layer_replication": null,
13
+ "layers_pattern": null,
14
+ "layers_to_transform": null,
15
+ "loftq_config": {},
16
+ "lora_alpha": 256,
17
+ "lora_bias": false,
18
+ "lora_dropout": 0.0,
19
+ "megatron_config": null,
20
+ "megatron_core": "megatron.core",
21
+ "modules_to_save": null,
22
+ "peft_type": "LORA",
23
+ "r": 128,
24
+ "rank_pattern": {},
25
+ "revision": null,
26
+ "target_modules": [
27
+ "v_proj",
28
+ "query_key_value",
29
+ "o_proj",
30
+ "up_proj",
31
+ "q_proj",
32
+ "out_proj",
33
+ "k_proj",
34
+ "down_proj",
35
+ "gate_proj"
36
+ ],
37
+ "task_type": "CAUSAL_LM",
38
+ "trainable_token_indices": null,
39
+ "use_dora": false,
40
+ "use_rslora": false
41
+ }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d311a6e07b29b5b7deaee4357520e131ac71af1c3232104fd77aa02d4e38f9e5
3
  size 1291899160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:990b210f00d3fd79e72528a99845e3119d791adf4d3d861b6d2a048cdab00e30
3
  size 1291899160
toilaluan/84b5262c-9e41-4939-9c06-b67b5cdd9044/adapter_config.json CHANGED
@@ -1 +1 @@
1
- {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "unsloth/Qwen2.5-Math-7B-Instruct", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["gate_proj", "o_proj", "out_proj", "v_proj", "k_proj", "q_proj", "query_key_value", "up_proj", "down_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
 
1
+ {"alpha_pattern": {}, "auto_mapping": null, "base_model_name_or_path": "unsloth/Qwen2.5-Math-7B-Instruct", "bias": "none", "fan_in_fan_out": false, "inference_mode": true, "init_lora_weights": true, "layer_replication": null, "layers_pattern": null, "layers_to_transform": null, "loftq_config": {}, "lora_alpha": 256, "lora_dropout": 0.0, "megatron_config": null, "megatron_core": "megatron.core", "modules_to_save": null, "peft_type": "LORA", "r": 128, "rank_pattern": {}, "revision": null, "target_modules": ["o_proj", "k_proj", "up_proj", "query_key_value", "q_proj", "out_proj", "gate_proj", "down_proj", "v_proj"], "task_type": "CAUSAL_LM", "use_dora": false, "use_rslora": false}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f6651393a12e39c286071f29714ec1bd15310e5c509b57dff436d175f48c715
3
  size 5752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fdcfcbd453fe5500e54844c52290ab47950e2dae775f5e623f7cf153ff2601b
3
  size 5752