{
  "modelname": "openai/whisper-base",
  "gen_args": {
    "num_beams": 3
  },
  "fallback": [1, 7, 5],
  "corpora": {
    "train": {
      "asc": {
        "languages": "ara",
        "limit": [1000]
      },
      "multipa": {
        "languages": ["ja", "pl", "mt", "hu", "fi", "el", "ta"],
        "limit": [1000, 1000, 1000, 1000, 1000, 1000, 1000]
      },
      "thchs": {
        "languages": "cmn",
        "limit": [1000]
      }
    },
    "dev": {
      "asc": {
        "languages": "ara",
        "limit": [50]
      },
      "multipa": {
        "languages": ["ja", "pl", "mt", "hu", "fi", "el", "ta"],
        "limit": [50, 50, 50, 50, 50, 50, 50]
      },
      "thchs": {
        "languages": "cmn",
        "limit": [50]
      }
    }
  },
  "hyperparams": {
    "output_dir": "../models/lowhipa-base-comb",
    "overwrite_output_dir": "True",
    "peft": "True",
    "per_device_train_batch_size": 64,
    "gradient_accumulation_steps": 1,
    "learning_rate": 0.001,
    "warmup_ratio": 0.1,
    "max_steps": 1410,
    "gradient_checkpointing": "True",
    "fp16": "True",
    "eval_strategy": "steps",
    "per_device_eval_batch_size": 8,
    "predict_with_generate": "True",
    "generation_max_length": 225,
    "save_steps": 282,
    "eval_steps": 282,
    "logging_steps": 282,
    "logging_first_step": "True",
    "report_to": ["tensorboard"],
    "load_best_model_at_end": "False",
    "metric_for_best_model": "pfer",
    "greater_is_better": "False",
    "hub_private_repo": "True",
    "push_to_hub": "False",
    "torch_empty_cache_steps": 4
  }
}