{
  "model_name": "./hebrew_aramaic_model_early_stopping",
  "direction": "he2ar",
  "vocabulary_size": 64174,
  "model_parameters": 77519872,
  "training_config": {
    "dataset_path": "./hebrew_aramaic_dataset",
    "output_dir": "./hebrew_aramaic_model_final",
    "model_name": "./hebrew_aramaic_model_early_stopping",
    "direction": "he2ar",
    "batch_size": 16,
    "learning_rate": 1e-05,
    "num_epochs": 3,
    "max_input_length": 512,
    "max_target_length": 512,
    "eval_steps": 500,
    "save_steps": 500,
    "warmup_steps": 500,
    "gradient_accumulation_steps": 1,
    "early_stopping_patience": 5,
    "early_stopping_threshold": 0.1,
    "seed": 42,
    "use_fp16": true,
    "use_wandb": false,
    "use_language_prefix": true,
    "skip_evaluation": false
  }
}