Spaces:
Running
Running
| { | |
| "experiments": { | |
| "test_exp_001": { | |
| "id": "test_exp_001", | |
| "name": "Test Experiment", | |
| "description": "Debug test", | |
| "created_at": "2025-07-20T14:01:48.871089", | |
| "status": "running", | |
| "metrics": [ | |
| { | |
| "timestamp": "2025-07-20T14:01:48.871096", | |
| "step": 25, | |
| "metrics": { | |
| "loss": 1.165, | |
| "accuracy": 0.75, | |
| "learning_rate": 3.5e-06 | |
| } | |
| } | |
| ], | |
| "parameters": {}, | |
| "artifacts": [], | |
| "logs": [] | |
| }, | |
| "exp_20250720_130853": { | |
| "id": "exp_20250720_130853", | |
| "name": "petite-elle-l-aime-3", | |
| "description": "SmolLM3 fine-tuning experiment", | |
| "created_at": "2025-07-20T11:20:01.780908", | |
| "status": "running", | |
| "metrics": [ | |
| { | |
| "timestamp": "2025-07-20T11:20:01.780908", | |
| "step": 25, | |
| "metrics": { | |
| "loss": 1.1659, | |
| "grad_norm": 10.3125, | |
| "learning_rate": 7e-08, | |
| "num_tokens": 1642080.0, | |
| "mean_token_accuracy": 0.75923578992486, | |
| "epoch": 0.004851130919895701 | |
| } | |
| }, | |
| { | |
| "timestamp": "2025-07-20T11:26:39.042155", | |
| "step": 50, | |
| "metrics": { | |
| "loss": 1.165, | |
| "grad_norm": 10.75, | |
| "learning_rate": 1.4291666666666667e-07, | |
| "num_tokens": 3324682.0, | |
| "mean_token_accuracy": 0.7577659255266189, | |
| "epoch": 0.009702261839791402 | |
| } | |
| }, | |
| { | |
| "timestamp": "2025-07-20T11:33:16.203045", | |
| "step": 75, | |
| "metrics": { | |
| "loss": 1.1639, | |
| "grad_norm": 10.6875, | |
| "learning_rate": 2.1583333333333334e-07, | |
| "num_tokens": 4987941.0, | |
| "mean_token_accuracy": 0.7581205774843692, | |
| "epoch": 0.014553392759687101 | |
| } | |
| }, | |
| { | |
| "timestamp": "2025-07-20T11:39:53.453917", | |
| "step": 100, | |
| "metrics": { | |
| "loss": 1.1528, | |
| "grad_norm": 10.75, | |
| "learning_rate": 2.8875e-07, | |
| "num_tokens": 6630190.0, | |
| "mean_token_accuracy": 0.7614579878747463, | |
| "epoch": 0.019404523679582803 | |
| } | |
| } | |
| ], | |
| "parameters": { | |
| "model_name": "HuggingFaceTB/SmolLM3-3B", | |
| "max_seq_length": 12288, | |
| "use_flash_attention": true, | |
| "use_gradient_checkpointing": false, | |
| "batch_size": 8, | |
| "gradient_accumulation_steps": 16, | |
| "learning_rate": 3.5e-06, | |
| "weight_decay": 0.01, | |
| "warmup_steps": 1200, | |
| "max_iters": 18000, | |
| "eval_interval": 1000, | |
| "log_interval": 25, | |
| "save_interval": 2000, | |
| "optimizer": "adamw_torch", | |
| "beta1": 0.9, | |
| "beta2": 0.999, | |
| "eps": 1e-08, | |
| "scheduler": "cosine", | |
| "min_lr": 3.5e-07, | |
| "fp16": false, | |
| "bf16": true, | |
| "ddp_backend": "nccl", | |
| "ddp_find_unused_parameters": false, | |
| "save_steps": 2000, | |
| "eval_steps": 1000, | |
| "logging_steps": 25, | |
| "save_total_limit": 5, | |
| "eval_strategy": "steps", | |
| "metric_for_best_model": "eval_loss", | |
| "greater_is_better": false, | |
| "load_best_model_at_end": true, | |
| "data_dir": null, | |
| "train_file": null, | |
| "validation_file": null, | |
| "test_file": null, | |
| "use_chat_template": true, | |
| "chat_template_kwargs": { | |
| "add_generation_prompt": true, | |
| "no_think_system_message": true | |
| }, | |
| "enable_tracking": true, | |
| "trackio_url": "https://tonic-test-trackio-test.hf.space", | |
| "trackio_token": null, | |
| "log_artifacts": true, | |
| "log_metrics": true, | |
| "log_config": true, | |
| "experiment_name": "petite-elle-l-aime-3", | |
| "dataset_name": "legmlai/openhermes-fr", | |
| "dataset_split": "train", | |
| "input_field": "prompt", | |
| "target_field": "accepted_completion", | |
| "filter_bad_entries": true, | |
| "bad_entry_field": "bad_entry", | |
| "packing": false, | |
| "max_prompt_length": 12288, | |
| "max_completion_length": 8192, | |
| "truncation": true, | |
| "dataloader_num_workers": 10, | |
| "dataloader_pin_memory": true, | |
| "dataloader_prefetch_factor": 3, | |
| "max_grad_norm": 1.0, | |
| "group_by_length": true | |
| }, | |
| "artifacts": [], | |
| "logs": [] | |
| }, | |
| "exp_20250720_134319": { | |
| "id": "exp_20250720_134319", | |
| "name": "petite-elle-l-aime-3-1", | |
| "description": "SmolLM3 fine-tuning experiment", | |
| "created_at": "2025-07-20T11:54:31.993219", | |
| "status": "running", | |
| "metrics": [ | |
| { | |
| "timestamp": "2025-07-20T11:54:31.993219", | |
| "step": 25, | |
| "metrics": { | |
| "loss": 1.166, | |
| "grad_norm": 10.375, | |
| "learning_rate": 7e-08, | |
| "num_tokens": 1642080.0, | |
| "mean_token_accuracy": 0.7590958896279335, | |
| "epoch": 0.004851130919895701 | |
| } | |
| }, | |
| { | |
| "timestamp": "2025-07-20T11:54:33.589487", | |
| "step": 25, | |
| "metrics": { | |
| "gpu_0_memory_allocated": 17.202261447906494, | |
| "gpu_0_memory_reserved": 75.474609375, | |
| "gpu_0_utilization": 0, | |
| "cpu_percent": 2.7, | |
| "memory_percent": 10.1 | |
| } | |
| } | |
| ], | |
| "parameters": { | |
| "model_name": "HuggingFaceTB/SmolLM3-3B", | |
| "max_seq_length": 12288, | |
| "use_flash_attention": true, | |
| "use_gradient_checkpointing": false, | |
| "batch_size": 8, | |
| "gradient_accumulation_steps": 16, | |
| "learning_rate": 3.5e-06, | |
| "weight_decay": 0.01, | |
| "warmup_steps": 1200, | |
| "max_iters": 18000, | |
| "eval_interval": 1000, | |
| "log_interval": 25, | |
| "save_interval": 2000, | |
| "optimizer": "adamw_torch", | |
| "beta1": 0.9, | |
| "beta2": 0.999, | |
| "eps": 1e-08, | |
| "scheduler": "cosine", | |
| "min_lr": 3.5e-07, | |
| "fp16": false, | |
| "bf16": true, | |
| "ddp_backend": "nccl", | |
| "ddp_find_unused_parameters": false, | |
| "save_steps": 2000, | |
| "eval_steps": 1000, | |
| "logging_steps": 25, | |
| "save_total_limit": 5, | |
| "eval_strategy": "steps", | |
| "metric_for_best_model": "eval_loss", | |
| "greater_is_better": false, | |
| "load_best_model_at_end": true, | |
| "data_dir": null, | |
| "train_file": null, | |
| "validation_file": null, | |
| "test_file": null, | |
| "use_chat_template": true, | |
| "chat_template_kwargs": { | |
| "add_generation_prompt": true, | |
| "no_think_system_message": true | |
| }, | |
| "enable_tracking": true, | |
| "trackio_url": "https://tonic-test-trackio-test.hf.space", | |
| "trackio_token": null, | |
| "log_artifacts": true, | |
| "log_metrics": true, | |
| "log_config": true, | |
| "experiment_name": "petite-elle-l-aime-3-1", | |
| "dataset_name": "legmlai/openhermes-fr", | |
| "dataset_split": "train", | |
| "input_field": "prompt", | |
| "target_field": "accepted_completion", | |
| "filter_bad_entries": true, | |
| "bad_entry_field": "bad_entry", | |
| "packing": false, | |
| "max_prompt_length": 12288, | |
| "max_completion_length": 8192, | |
| "truncation": true, | |
| "dataloader_num_workers": 10, | |
| "dataloader_pin_memory": true, | |
| "dataloader_prefetch_factor": 3, | |
| "max_grad_norm": 1.0, | |
| "group_by_length": true | |
| }, | |
| "artifacts": [], | |
| "logs": [] | |
| } | |
| }, | |
| "current_experiment": "exp_20250720_134319", | |
| "last_updated": "2025-07-20T14:05:18.615415" | |
| } |