# Grogros's picture
# Upload finetuning_config.yaml with huggingface_hub
# c95a2a9 verified
# raw
# history blame
# 1.21 kB
# Fine-tuning run configuration: base model, dataset mix, and trainer settings.
# NOTE(review): the `!!python/object/apply:` tags below construct Python
# objects at load time, so this file cannot be read with a safe loader
# (e.g. PyYAML `yaml.safe_load`); load it only from a trusted source.
alpha: 0.2
base_model: mistralai/Ministral-8B-Instruct-2410
custom_name: d4-a0.2-v4
dtype: bfloat16
# NOTE(review): `lambdas` and `proportions` have three entries each while
# `loss_types` has only two - confirm the consumer expects these lengths.
lambdas:
- 1.0
- 1.0
- 1.0
lora_config: null
loss_types:
- anti-watermark
- anti-watermark
meta_learning_config: null
multi_gpu: true
n_wm_tokens: 0
# The three weights sum to 1.0; presumably one per dataset listed in
# `watermark_datasets` and `regularization_datasets` - TODO confirm the order.
proportions:
- 0.5
- 0.2
- 0.3
random_training_config: null
# Each entry applies finetuning.dataset.DatasetType to the nested argument
# list, so the dataset name must stay indented under its tag.
regularization_datasets:
- !!python/object/apply:finetuning.dataset.DatasetType
  - AlpacaGPT4
- !!python/object/apply:finetuning.dataset.DatasetType
  - WO_NoHealth
sequence_length: 512
streaming: true
# Key names match Hugging Face `TrainingArguments` fields; presumably this
# mapping is forwarded to the trainer as-is - TODO confirm against the loader.
training_args:
  # NOTE(review): bf16 and fp16 are both false although the top-level `dtype`
  # is bfloat16 - confirm that disabling mixed precision is intended.
  bf16: false
  ddp_find_unused_parameters: false
  do_train: true
  fp16: false
  gradient_accumulation_steps: 32
  gradient_checkpointing: false
  hub_strategy: all_checkpoints
  learning_rate: 2.0e-05
  logging_steps: 10
  lr_scheduler_type: cosine
  # NOTE(review): if these are Hugging Face TrainingArguments, a positive
  # `max_steps` takes precedence over `num_train_epochs` - verify.
  max_steps: 2500
  num_train_epochs: 1
  optim: adafactor
  output_dir: Grogros/dmWM-mistralai-Ministral-8B-Instruct-2410-WOHealth-Al4-NH-WO-d4-a0.2-v4
  overwrite_output_dir: true
  per_device_train_batch_size: 1
  push_to_hub: true
  # `none` is a plain string here, not YAML null.
  report_to: none
  save_steps: 500
  save_strategy: steps
  warmup_ratio: 0.1
watermark_datasets:
- !!python/object/apply:finetuning.dataset.DatasetType
  - WOHealth
watermark_eval_config: []