sabrieyuboglu committed on
Commit
0e72f89
·
verified ·
1 Parent(s): c1f2ae2

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +215 -0
config.yaml ADDED
@@ -0,0 +1,215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _config_type:
2
+ _is_type: true
3
+ _module: capsules.train
4
+ _qualname: TrainConfig
5
+ cache_ema_alpha: 0.9
6
+ context:
7
+ _config_type:
8
+ _is_type: true
9
+ _module: capsules.tasks.longhealth.context
10
+ _qualname: LongHealthStructuredContextConfig
11
+ patient_ids:
12
+ - patient_01
13
+ - patient_02
14
+ - patient_03
15
+ - patient_04
16
+ - patient_05
17
+ - patient_06
18
+ - patient_07
19
+ - patient_08
20
+ - patient_09
21
+ - patient_10
22
+ dataset:
23
+ _config_type:
24
+ _is_type: true
25
+ _module: capsules.datasets
26
+ _qualname: CapsuleDatasetLatest.Config
27
+ convo_transforms: null
28
+ data_sources:
29
+ - !!python/tuple
30
+ - hazy-research/capsules/generate_longhealth_simple_p10_s5_n65536:v0
31
+ - null
32
+ - !!python/tuple
33
+ - hazy-research/capsules/generate_longhealth_simple_p10_s5_n65536:v1
34
+ - null
35
+ dataset_weights: null
36
+ is_wandb: true
37
+ kwargs: {}
38
+ label_type: logits
39
+ max_sequence_length: 1024
40
+ target:
41
+ _is_type: true
42
+ _module: capsules.datasets
43
+ _qualname: CapsuleDatasetLatest
44
+ top_k_logits: 20
45
+ user_prompt_prefix: null
46
+ device: cuda
47
+ distributed_backend: gloo
48
+ ema_cache: false
49
+ epochs: 2
50
+ eval_datasets:
51
+ - _config_type:
52
+ _is_type: true
53
+ _module: capsules.train
54
+ _qualname: EvalDatasetConfig
55
+ dataloader_num_workers: 0
56
+ dataset:
57
+ _config_type:
58
+ _is_type: true
59
+ _module: capsules.tasks.longhealth
60
+ _qualname: LongHealthEvalDataset.Config
61
+ convo_transforms: null
62
+ data_sources: []
63
+ dataset_weights: null
64
+ is_wandb: false
65
+ kwargs: {}
66
+ label_type: tokens
67
+ max_questions: 256
68
+ patient_ids:
69
+ - patient_01
70
+ - patient_02
71
+ - patient_03
72
+ - patient_04
73
+ - patient_05
74
+ - patient_06
75
+ - patient_07
76
+ - patient_08
77
+ - patient_09
78
+ - patient_10
79
+ target:
80
+ _is_type: true
81
+ _module: capsules.tasks.longhealth
82
+ _qualname: LongHealthEvalDataset
83
+ top_k_logits: 20
84
+ user_prompt_prefix: null
85
+ local_batch_size: 16
86
+ name_for_wandb: longhealth_mc
87
+ only_eval_rank_0: false
88
+ eval_every_n_steps: 256
89
+ eval_log_table: true
90
+ eval_max_samples: null
91
+ generate_datasets:
92
+ - _config_type:
93
+ _is_type: true
94
+ _module: capsules.train
95
+ _qualname: GenerateDatasetConfig
96
+ batch_size: 16
97
+ dataloader_num_workers: 0
98
+ dataset:
99
+ _config_type:
100
+ _is_type: true
101
+ _module: capsules.tasks.longhealth
102
+ _qualname: LongHealthMultipleChoiceGenerateDataset.Config
103
+ cot: true
104
+ include_diagnosis: true
105
+ kwargs: {}
106
+ max_questions: null
107
+ patient_ids:
108
+ - patient_01
109
+ - patient_02
110
+ - patient_03
111
+ - patient_04
112
+ - patient_05
113
+ - patient_06
114
+ - patient_07
115
+ - patient_08
116
+ - patient_09
117
+ - patient_10
118
+ target:
119
+ _is_type: true
120
+ _module: capsules.tasks.longhealth
121
+ _qualname: LongHealthMultipleChoiceGenerateDataset
122
+ name_for_wandb: longhealth_mc
123
+ num_samples: 4
124
+ num_samples_final: 8
125
+ override_max_tokens: null
126
+ temperature: 0.3
127
+ generate_every_n_steps: 512
128
+ generate_max_new_tokens: 512
129
+ global_batch_size: 64
130
+ keep_last_n_saved: 1
131
+ kv_cache_initializer:
132
+ _config_type:
133
+ _is_type: true
134
+ _module: capsules.kv_initialization.strategies.first_n_tokens
135
+ _qualname: KVCacheInitFromFirstNTokensOfContext.Config
136
+ context: null
137
+ kwargs: {}
138
+ max_tokens: 2048
139
+ num_frozen_tokens: 1
140
+ target:
141
+ _is_type: true
142
+ _module: capsules.kv_initialization.strategies.first_n_tokens
143
+ _qualname: KVCacheInitFromFirstNTokensOfContext
144
+ launch_id: 2025-05-10-14-56-42-train_longhealth_simple
145
+ local_batch_size: 4
146
+ log_logprob_viz: false
147
+ loss_type: logits
148
+ lr: 0.02
149
+ lr_scheduler: null
150
+ max_optimizer_steps: -1
151
+ model:
152
+ _config_type:
153
+ _is_type: true
154
+ _module: capsules.config
155
+ _qualname: HFModelConfig
156
+ attn_implementation: einsum
157
+ checkpoint_path: null
158
+ load_kwargs: {}
159
+ model_cls:
160
+ _is_type: true
161
+ _module: capsules.models.llama
162
+ _qualname: LlamaForCausalLM
163
+ peft:
164
+ _config_type:
165
+ _is_type: true
166
+ _module: capsules.config
167
+ _qualname: PeftConfig
168
+ adapter_non_linearity: relu
169
+ adapter_reduction_factor: 16
170
+ alpha: 16
171
+ bias: none
172
+ dropout: 0.0
173
+ enabled: false
174
+ encoder_dropout: 0.0
175
+ encoder_hidden_size: null
176
+ encoder_reparameterization_type: MLP
177
+ extra_params: {}
178
+ method: lora
179
+ num_virtual_tokens: 20
180
+ prefix_projection: false
181
+ prompt_tuning_init: null
182
+ prompt_tuning_init_text: null
183
+ r: 8
184
+ target_modules: null
185
+ task_type: CAUSAL_LM
186
+ pretrained_model_name_or_path: meta-llama/Llama-3.2-3B-Instruct
187
+ tuning_method: custom_prefix
188
+ name: train_longhealth_simple_p10_lr0.02_toks2048
189
+ online_model: true
190
+ optimizer: adam
191
+ output_dir: /data/sabri/capsules
192
+ pretrained_cache_path: null
193
+ run_dir: /data/sabri/capsules/2025-05-10-14-56-42-train_longhealth_simple/68e4c064-dc5a-46c8-a726-b3c7977e9e1a
194
+ run_id: 68e4c064-dc5a-46c8-a726-b3c7977e9e1a
195
+ save_after_training: true
196
+ save_every_n_steps: 512
197
+ save_to_wandb: true
198
+ script_id: train_longhealth_simple
199
+ seed: 42
200
+ tokenizer: meta-llama/Llama-3.2-1B-Instruct
201
+ use_batch_sampler: false
202
+ wandb:
203
+ _config_type:
204
+ _is_type: true
205
+ _module: capsules.utils.wandb
206
+ _qualname: WandBConfig
207
+ entity: hazy-research
208
+ group: null
209
+ name: train_longhealth_simple_p10_lr0.02_toks2048
210
+ notes: null
211
+ project: capsules
212
+ tags:
213
+ - train
214
+ - longhealth
215
+ - patientsp10