chore: _
This commit is contained in:
14
main.py
14
main.py
@@ -86,14 +86,16 @@ def run_sweep(base_config: TrainingConfig, dataset_path: str):
|
||||
"parameters": {
|
||||
"learning_rate": {
|
||||
"distribution": "log_uniform_values",
|
||||
"min": 1e-5,
|
||||
"max": 1e-4,
|
||||
"min": 1e-7,
|
||||
"max": 1e-5,
|
||||
},
|
||||
"lora_r": {"values": [8]},
|
||||
"lora_alpha": {"values": [16]},
|
||||
"per_device_train_batch_size": {"values": [16]},
|
||||
"gradient_accumulation_steps": {"values": [2]},
|
||||
"lora_r": {"values": [32]},
|
||||
"lora_alpha": {"values": [64]},
|
||||
"per_device_train_batch_size": {"values": [32]},
|
||||
"gradient_accumulation_steps": {"values": [4, 8]},
|
||||
"num_train_epochs": {"values": [1]},
|
||||
"warmup_steps": {"values": [10]},
|
||||
"max_grad_norm": {"values": [0.1, 0.3, 0.5]},
|
||||
},
|
||||
"early_terminate": {"type": "hyperband", "min_iter": 100},
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user