File size: 3,675 Bytes
9f2f8d3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 |
{
"batch_size": 32,
"buffer_size": 64,
"eval_mix": "chris_aubo",
"frozen_keys": [
"*hf_model*"
],
"lora": false,
"lora_config": {
"bias": "none",
"lora_alpha": 16,
"lora_dropout": 0.05,
"r": 8
},
"model": {
"heads": {
"action": {
"args": [],
"kwargs": {
"action_dim": 7,
"action_horizon": 4,
"dropout_rate": 0.0,
"n_diffusion_samples": 1,
"readout_key": "readout_action",
"token_embedding_size": 768,
"use_map": false
},
"module": "octo.model.components.action_heads",
"name": "DiffusionActionHead"
}
},
"max_horizon": 10,
"observation_tokenizers": {
"primary": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {
"in_features": 6
},
"module": "octo.model.components.vit_encoders",
"name": "SmallStem16"
},
"obs_stack_keys": [
"image_primary"
],
"task_stack_keys": [
"image_primary"
]
},
"module": "octo.model.components.tokenizers",
"name": "ImageTokenizer"
}
},
"readouts": {
"action": 1
},
"repeat_task_tokens": true,
"task_tokenizers": {
"language": {
"args": [],
"kwargs": {
"encoder": "t5-base",
"finetune_encoder": false
},
"module": "octo.model.components.tokenizers",
"name": "LanguageTokenizer"
}
},
"token_embedding_size": 768,
"transformer_kwargs": {
"add_position_embedding": false,
"attention_dropout_rate": 0.0,
"dropout_rate": 0.0,
"mlp_dim": 3072,
"num_attention_heads": 12,
"num_layers": 12
},
"use_correct_attention": true
},
"normalize_method": "sign",
"obs_token_nums": {
"primary": 256
},
"output_dir": "ljp_aubo_20250610_test",
"pretrained": {
"kwargs": {
"subpath": "oxe-g2-checkpoint-300000"
},
"model": "hf://chuanmew/octo_torch"
},
"run_name": "aubo",
"sampler_num_samples": 2560000,
"seed": 42,
"subsample_length": 99999,
"text_processor": {
"args": [],
"kwargs": {
"encode_with_model": false,
"tokenizer_kwargs": {
"max_length": 16,
"padding": "max_length",
"return_tensors": "np",
"truncation": true
},
"tokenizer_name": "t5-base"
},
"module": "octo.components.text_processing",
"name": "HFTokenizer"
},
"train_mix": "ljp_aubo_merged_20250519to20250529_20250604",
"training_arguments": {
"bf16": true,
"dataloader_pin_memory": true,
"ddp_find_unused_parameters": true,
"eval_steps": 1000,
"gradient_accumulation_steps": 1,
"learning_rate": 3e-05,
"logging_nan_inf_filter": false,
"logging_steps": 1000,
"lr_scheduler_kwargs": {
"decay_type": "cosine",
"min_lr_ratio": 0.05,
"num_decay_steps": 0
},
"lr_scheduler_type": "warmup_stable_decay",
"max_grad_norm": 1.0,
"max_steps": 5200,
"optim": "adamw_torch_fused",
"per_device_eval_batch_size": 1,
"per_device_train_batch_size": 1,
"report_to": "wandb",
"save_safetensors": true,
"save_steps": 5200,
"torch_compile": true,
"warmup_steps": 100,
"weight_decay": 0.1
},
"training_keys": [
"*action*",
"*observation_tokenizers*",
"*transformer.transformer*",
"*task_projections*",
"*obs_projections*",
"*readout_embeddings*",
"*task_pos_embeddings*",
"*obs_pos_embeddings*"
]
}
|