JYP2024 committed on
Commit
6f941bc
1 Parent(s): fec48dc

EBranchformer_SV

Browse files
Files changed (24) hide show
  1. README.md +16 -0
  2. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/40epoch.pth +3 -0
  3. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/RESULTS.md +17 -0
  4. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/config.yaml +226 -0
  5. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/backward_time.png +0 -0
  6. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/clip.png +0 -0
  7. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/eer.png +0 -0
  8. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/forward_time.png +0 -0
  9. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/gpu_max_cached_mem_GB.png +0 -0
  10. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/grad_norm.png +0 -0
  11. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/iter_time.png +0 -0
  12. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/loss.png +0 -0
  13. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/loss_scale.png +0 -0
  14. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/mindcf.png +0 -0
  15. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/n_trials.png +0 -0
  16. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/nontrg_mean.png +0 -0
  17. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/nontrg_std.png +0 -0
  18. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/optim0_lr0.png +0 -0
  19. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/optim_step_time.png +0 -0
  20. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/train_time.png +0 -0
  21. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/trg_mean.png +0 -0
  22. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/trg_std.png +0 -0
  23. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/latest.pth +1 -0
  24. spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/train.log +0 -0
README.md CHANGED
@@ -1,3 +1,19 @@
1
  ---
2
  license: cc-by-4.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: cc-by-4.0
3
  ---
4
+ # RESULTS
5
+ ## Environments
6
+ date: 2024-11-11 13:27:22.449116
7
+
8
+ - python version: 3.10.13 (main, Sep 11 2023, 13:44:35) [GCC 11.2.0]
9
+ - espnet version: 202409
10
+ - pytorch version: 2.2.2+rocm5.6
11
+
12
+ | | Mean | Std |
13
+ |---|---|---|
14
+ | Target | 8.1720 | 3.9750 |
15
+ | Non-target | 2.0805 | 2.0805 |
16
+
17
+ | Model name | EER(%) | minDCF |
18
+ |---|---|---|
19
+ | conf/tuning/train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop | 0.638 | 0.04797 |
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/40epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6772cffb1283459b3d342411022b30ec7d32ded12f15855c8ba89b2c976eac2c
3
+ size 156441550
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/RESULTS.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- Generated by scripts/utils/show_spk_result.py -->
2
+ # RESULTS
3
+ ## Environments
4
+ date: 2024-11-11 13:27:22.449116
5
+
6
+ - python version: 3.10.13 (main, Sep 11 2023, 13:44:35) [GCC 11.2.0]
7
+ - espnet version: 202409
8
+ - pytorch version: 2.2.2+rocm5.6
9
+
10
+ | | Mean | Std |
11
+ |---|---|---|
12
+ | Target | 8.1720 | 3.9750 |
13
+ | Non-target | 2.0805 | 2.0805 |
14
+
15
+ | Model name | EER(%) | minDCF |
16
+ |---|---|---|
17
+ | conf/tuning/train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop | 0.638 | 0.04797 |
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/config.yaml ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: true
5
+ dry_run: false
6
+ iterator_type: category
7
+ valid_iterator_type: sequence
8
+ output_dir: exp/spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 6
12
+ num_att_plot: 0
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: 8
16
+ dist_rank: 0
17
+ local_rank: 0
18
+ dist_master_addr: localhost
19
+ dist_master_port: null
20
+ dist_launcher: null
21
+ multiprocessing_distributed: true
22
+ unused_parameters: true
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: false
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 40
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - eer
44
+ - min
45
+ keep_nbest_models: 3
46
+ nbest_averaging_interval: 0
47
+ grad_clip: 9999
48
+ grad_clip_type: 2.0
49
+ grad_noise: false
50
+ accum_grad: 1
51
+ no_forward_run: false
52
+ resume: true
53
+ train_dtype: float32
54
+ use_amp: false
55
+ log_interval: 100
56
+ use_matplotlib: true
57
+ use_tensorboard: true
58
+ create_graph_in_tensorboard: false
59
+ use_wandb: false
60
+ wandb_project: null
61
+ wandb_id: null
62
+ wandb_entity: null
63
+ wandb_name: null
64
+ wandb_model_log_interval: -1
65
+ detect_anomaly: false
66
+ use_adapter: false
67
+ adapter: lora
68
+ save_strategy: all
69
+ adapter_conf: {}
70
+ pretrain_path: null
71
+ init_param: []
72
+ ignore_init_mismatch: false
73
+ freeze_param: []
74
+ num_iters_per_epoch: null
75
+ batch_size: 200
76
+ valid_batch_size: 80
77
+ batch_bins: 1000000
78
+ valid_batch_bins: null
79
+ category_sample_size: 10
80
+ train_shape_file:
81
+ - exp/spk_stats_16k/train/speech_shape
82
+ valid_shape_file:
83
+ - exp/spk_stats_16k/valid/speech_shape
84
+ batch_type: folded
85
+ valid_batch_type: null
86
+ fold_length:
87
+ - 120000
88
+ sort_in_batch: descending
89
+ shuffle_within_batch: false
90
+ sort_batch: descending
91
+ multiple_iterator: false
92
+ chunk_length: 500
93
+ chunk_shift_ratio: 0.5
94
+ num_cache_chunks: 1024
95
+ chunk_excluded_key_prefixes: []
96
+ chunk_default_fs: null
97
+ chunk_max_abs_length: null
98
+ chunk_discard_short_samples: true
99
+ train_data_path_and_name_and_type:
100
+ - - dump/raw/voxceleb12_devs/wav.scp
101
+ - speech
102
+ - sound
103
+ - - dump/raw/voxceleb12_devs/utt2spk
104
+ - spk_labels
105
+ - text
106
+ valid_data_path_and_name_and_type:
107
+ - - dump/raw/voxceleb1_test/trial.scp
108
+ - speech
109
+ - sound
110
+ - - dump/raw/voxceleb1_test/trial2.scp
111
+ - speech2
112
+ - sound
113
+ - - dump/raw/voxceleb1_test/trial_label
114
+ - spk_labels
115
+ - text
116
+ multi_task_dataset: false
117
+ allow_variable_data_keys: false
118
+ max_cache_size: 0.0
119
+ max_cache_fd: 32
120
+ allow_multi_rates: false
121
+ valid_max_cache_size: null
122
+ exclude_weight_decay: false
123
+ exclude_weight_decay_conf: {}
124
+ optim: adamw
125
+ optim_conf:
126
+ lr: 0.001
127
+ weight_decay: 0.0001
128
+ amsgrad: false
129
+ scheduler: cosineannealingwarmuprestarts
130
+ scheduler_conf:
131
+ first_cycle_steps: 300000
132
+ cycle_mult: 1.0
133
+ max_lr: 0.001
134
+ min_lr: 1.0e-07
135
+ warmup_steps: 30000
136
+ gamma: 0.7
137
+ init: null
138
+ use_preprocessor: true
139
+ input_size: null
140
+ target_duration: 3.0
141
+ spk2utt: dump/raw/voxceleb12_devs/spk2utt
142
+ spk_num: 7205
143
+ sample_rate: 16000
144
+ num_eval: 10
145
+ rir_scp: ''
146
+ model_conf:
147
+ extract_feats_in_collect_stats: false
148
+ frontend: melspec_torch
149
+ frontend_conf:
150
+ preemp: true
151
+ n_fft: 512
152
+ log: true
153
+ win_length: 400
154
+ hop_length: 160
155
+ n_mels: 80
156
+ normalize: mn
157
+ specaug: null
158
+ specaug_conf: {}
159
+ normalize: null
160
+ normalize_conf: {}
161
+ encoder: e_branchformer
162
+ encoder_conf:
163
+ output_size: 384
164
+ attention_heads: 6
165
+ attention_layer_type: rel_selfattn
166
+ pos_enc_layer_type: rel_pos
167
+ rel_pos_type: latest
168
+ cgmlp_linear_units: 1536
169
+ cgmlp_conv_kernel: 31
170
+ use_linear_after_conv: false
171
+ gate_activation: identity
172
+ num_blocks: 6
173
+ dropout_rate: 0.1
174
+ positional_dropout_rate: 0.1
175
+ attention_dropout_rate: 0.1
176
+ input_layer: conv2d2
177
+ layer_drop_rate: 0.05
178
+ linear_units: 1536
179
+ positionwise_layer_type: linear
180
+ use_ffn: true
181
+ macaron_ffn: true
182
+ merge_conv_kernel: 31
183
+ aggregate_layer: true
184
+ pooling: chn_attn_stat
185
+ pooling_conf: {}
186
+ projector: rawnet3
187
+ projector_conf:
188
+ output_size: 192
189
+ preprocessor: spk
190
+ preprocessor_conf:
191
+ target_duration: 3.0
192
+ sample_rate: 16000
193
+ num_eval: 5
194
+ noise_apply_prob: 0.6
195
+ noise_info:
196
+ - - 1.0
197
+ - dump/raw/musan_speech.scp
198
+ - - 4
199
+ - 7
200
+ - - 13
201
+ - 20
202
+ - - 1.0
203
+ - dump/raw/musan_noise.scp
204
+ - - 1
205
+ - 1
206
+ - - 0
207
+ - 15
208
+ - - 1.0
209
+ - dump/raw/musan_music.scp
210
+ - - 1
211
+ - 1
212
+ - - 0
213
+ - 15
214
+ rir_apply_prob: 0.6
215
+ rir_scp: dump/raw/rirs.scp
216
+ loss: aamsoftmax_sc_topk
217
+ loss_conf:
218
+ margin: 0.2
219
+ scale: 32
220
+ K: 3
221
+ mp: 0.06
222
+ k_top: 5
223
+ required:
224
+ - output_dir
225
+ version: '202409'
226
+ distributed: true
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/backward_time.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/clip.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/eer.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/forward_time.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/gpu_max_cached_mem_GB.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/grad_norm.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/iter_time.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/loss.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/loss_scale.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/mindcf.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/n_trials.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/nontrg_mean.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/nontrg_std.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/optim0_lr0.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/optim_step_time.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/train_time.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/trg_mean.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/images/trg_std.png ADDED
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/latest.pth ADDED
@@ -0,0 +1 @@
 
 
1
+ 40epoch.pth
spk_train_ebranchformer_aggregate_sys1_D384_L6_Rel_LayerDrop_raw/train.log ADDED
The diff for this file is too large to render. See raw diff