forked from jonatasgrosman/wav2vec2-sprint
-
Notifications
You must be signed in to change notification settings - Fork 0
/
sweep.yaml
78 lines (78 loc) · 1.47 KB
/
sweep.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
---
# Hyperparameter sweep definition for fine-tuning
# facebook/wav2vec2-large-xlsr-53 with dataset config "fi".
# Each run executes `program`; the search picks parameter combinations at
# random and tries to minimize the `eval/loss` metric.

program: run_common_voice.py
name: hf-wav2vec-sprint-fi
method: random

# Objective the sweep optimizes.
metric:
  goal: minimize
  name: eval/loss

# `value`  -> constant, identical for every run.
# `values` -> discrete set of candidates the search chooses from.
parameters:
  # --- Fixed run setup ------------------------------------------------------
  seed:
    value: 42
  report_to:
    value: wandb
  model_name_or_path:
    value: facebook/wav2vec2-large-xlsr-53
  dataset_config_name:
    value: fi
  output_dir:
    value: ../models/fi/wav2vec2-large-xlsr-fi-sweep
  cache_dir:
    value: ../data/fi
  overwrite_output_dir:
    value: true
  fp16:
    value: true

  # --- Fixed training / evaluation schedule ---------------------------------
  max_steps:
    value: 500
  eval_steps:
    value: 100
  logging_steps:
    value: 100
  do_eval:
    value: true
  do_train:
    value: true
  per_device_train_batch_size:
    value: 16
  per_device_eval_batch_size:
    value: 16
  dataloader_num_workers:
    value: 10
  preprocessing_num_workers:
    value: 10
  load_best_model_at_end:
    value: true
  save_total_limit:
    value: 1
  evaluation_strategy:
    value: steps
  freeze_feature_extractor:
    value: true
  group_by_length:
    value: true

  # --- Fixed data filtering / LR schedule shape -----------------------------
  # NOTE(review): units of min/max_duration are presumably seconds; confirm
  # against run_common_voice.py.
  min_duration:
    value: 2.0
  max_duration:
    value: 9.0
  lr_warmup_ratio:
    value: 0.5
  lr_constant_ratio:
    value: 0.0

  # --- Searched hyperparameters ---------------------------------------------
  augmentation_factor:
    values: [0, 1]
  layerdrop:
    value: 0.0
  # Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `1e-4` as a string, not a float.
  learning_rate:
    values: [1.0e-4, 3.0e-4, 6.0e-4, 1.0e-3]
  attention_dropout:
    values: [0.05, 0.1, 0.2]
  activation_dropout:
    values: [0.05, 0.1, 0.2]
  hidden_dropout:
    values: [0.05, 0.1, 0.2]
  feat_proj_dropout:
    values: [0.05, 0.1, 0.2]
  mask_time_prob:
    values: [0.05, 0.1, 0.2]

# Early stopping of poorly performing runs.
# NOTE(review): max_steps is 500 and eval_steps is 100 above; confirm that
# min_iter 200 is reachable in the unit Hyperband counts (metric reports vs.
# training steps), otherwise no run will ever be terminated early.
early_terminate:
  type: hyperband
  min_iter: 200