Yosuke Kashiwagi committed on
Commit ·
92a91e8
1
Parent(s): 3fb58dc
add up to 9 epochs.
Browse files
- exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz +0 -0
- exp/bestrq_stats_raw_en/train/feats_stats.npz +0 -0
- exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz +0 -0
- exp/bestrq_stats_raw_en/valid/feats_stats.npz +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/1epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/2epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/3epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/4epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/5epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/6epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/7epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/8epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/9epoch.pth +3 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/config.yaml +162 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/backward_time.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/forward_time.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/iter_time.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/loss.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/train_time.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png +0 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/latest.pth +1 -0
- exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth +1 -0
exp/bestrq_stats_raw_en/train/feats_lengths_stats.npz
ADDED
|
Binary file (778 Bytes). View file
|
|
|
exp/bestrq_stats_raw_en/train/feats_stats.npz
ADDED
|
Binary file (1.4 kB). View file
|
|
|
exp/bestrq_stats_raw_en/valid/feats_lengths_stats.npz
ADDED
|
Binary file (778 Bytes). View file
|
|
|
exp/bestrq_stats_raw_en/valid/feats_stats.npz
ADDED
|
Binary file (1.4 kB). View file
|
|
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/1epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0695cc3c45eb5939faf60b4d16ce9887668df054a37fcfd0cbfcd4e189e364d5
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/2epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:550e25732071e5b9c7f5806ebc6d89c88e45b241b12607ef0752caf9e59b9eec
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/3epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e5cb83fe0945168adfade85b039b3c38f3de6be93ff40a4a24af30c487f0743
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/4epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68bb0a19604a91a4506c52ae3213c6c6efea4214f4f4c193f63cfe10102f90c1
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/5epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d0eac0949065e62fc1520768bd235a5f9c123b92c11838cab89554e8798a013d
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/6epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6004732a67b5dc0e9ae2f658c49f94d4b1963b8e3df4ad9c687ff515a77391ee
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/7epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf71204536e931dec0b2c97a9315c3e835e7ff4eaa2b004be7c8e5edbee0a873
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/8epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5deb80b4b3c4c64c5627cc718e0a41f2c43d82eecd5f5911041b1e855610300
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/9epoch.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a5ec6f4e976e444c72a1177eb3793cf391c87dfcd322ef5fc2108cb45f4268a
|
| 3 |
+
size 477318768
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/config.yaml
ADDED
|
@@ -0,0 +1,162 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
config: conf/tuning/train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k.yaml
|
| 2 |
+
print_config: false
|
| 3 |
+
log_level: INFO
|
| 4 |
+
dry_run: false
|
| 5 |
+
iterator_type: sequence
|
| 6 |
+
output_dir: exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en
|
| 7 |
+
ngpu: 1
|
| 8 |
+
seed: 0
|
| 9 |
+
num_workers: 1
|
| 10 |
+
num_att_plot: 3
|
| 11 |
+
dist_backend: nccl
|
| 12 |
+
dist_init_method: env://
|
| 13 |
+
dist_world_size: 4
|
| 14 |
+
dist_rank: 0
|
| 15 |
+
local_rank: 0
|
| 16 |
+
dist_master_addr: localhost
|
| 17 |
+
dist_master_port: 44969
|
| 18 |
+
dist_launcher: null
|
| 19 |
+
multiprocessing_distributed: true
|
| 20 |
+
unused_parameters: false
|
| 21 |
+
sharded_ddp: false
|
| 22 |
+
cudnn_enabled: true
|
| 23 |
+
cudnn_benchmark: false
|
| 24 |
+
cudnn_deterministic: false
|
| 25 |
+
collect_stats: false
|
| 26 |
+
write_collected_feats: false
|
| 27 |
+
max_epoch: 500
|
| 28 |
+
patience: null
|
| 29 |
+
val_scheduler_criterion:
|
| 30 |
+
- valid
|
| 31 |
+
- loss
|
| 32 |
+
early_stopping_criterion:
|
| 33 |
+
- valid
|
| 34 |
+
- loss
|
| 35 |
+
- min
|
| 36 |
+
best_model_criterion:
|
| 37 |
+
- - valid
|
| 38 |
+
- masked_acc
|
| 39 |
+
- max
|
| 40 |
+
keep_nbest_models: 300
|
| 41 |
+
nbest_averaging_interval: 0
|
| 42 |
+
grad_clip: 5.0
|
| 43 |
+
grad_clip_type: 2.0
|
| 44 |
+
grad_noise: false
|
| 45 |
+
accum_grad: 8
|
| 46 |
+
no_forward_run: false
|
| 47 |
+
resume: true
|
| 48 |
+
train_dtype: float32
|
| 49 |
+
use_amp: true
|
| 50 |
+
log_interval: null
|
| 51 |
+
use_matplotlib: true
|
| 52 |
+
use_tensorboard: true
|
| 53 |
+
use_wandb: false
|
| 54 |
+
wandb_project: null
|
| 55 |
+
wandb_id: null
|
| 56 |
+
wandb_entity: null
|
| 57 |
+
wandb_name: null
|
| 58 |
+
wandb_model_log_interval: -1
|
| 59 |
+
detect_anomaly: false
|
| 60 |
+
pretrain_path: null
|
| 61 |
+
init_param: []
|
| 62 |
+
ignore_init_mismatch: false
|
| 63 |
+
freeze_param: []
|
| 64 |
+
num_iters_per_epoch: null
|
| 65 |
+
batch_size: 256
|
| 66 |
+
valid_batch_size: null
|
| 67 |
+
batch_bins: 1000000
|
| 68 |
+
valid_batch_bins: null
|
| 69 |
+
train_shape_file:
|
| 70 |
+
- exp/bestrq_stats_raw_en/train/speech_shape
|
| 71 |
+
valid_shape_file:
|
| 72 |
+
- exp/bestrq_stats_raw_en/valid/speech_shape
|
| 73 |
+
batch_type: folded
|
| 74 |
+
valid_batch_type: null
|
| 75 |
+
fold_length:
|
| 76 |
+
- 80000
|
| 77 |
+
sort_in_batch: descending
|
| 78 |
+
sort_batch: descending
|
| 79 |
+
multiple_iterator: false
|
| 80 |
+
chunk_length: 500
|
| 81 |
+
chunk_shift_ratio: 0.5
|
| 82 |
+
num_cache_chunks: 1024
|
| 83 |
+
train_data_path_and_name_and_type:
|
| 84 |
+
- - dump/raw/train_60k/wav.scp
|
| 85 |
+
- speech
|
| 86 |
+
- sound
|
| 87 |
+
valid_data_path_and_name_and_type:
|
| 88 |
+
- - dump/raw/dev/wav.scp
|
| 89 |
+
- speech
|
| 90 |
+
- sound
|
| 91 |
+
allow_variable_data_keys: false
|
| 92 |
+
max_cache_size: 0.0
|
| 93 |
+
max_cache_fd: 32
|
| 94 |
+
valid_max_cache_size: null
|
| 95 |
+
optim: adam
|
| 96 |
+
optim_conf:
|
| 97 |
+
lr: 0.0001
|
| 98 |
+
scheduler: warmuplr
|
| 99 |
+
scheduler_conf:
|
| 100 |
+
warmup_steps: 30000
|
| 101 |
+
init: xavier_uniform
|
| 102 |
+
input_size: null
|
| 103 |
+
model_conf:
|
| 104 |
+
lsm_weight: 0.0
|
| 105 |
+
length_normalized_loss: false
|
| 106 |
+
vector_size: 16
|
| 107 |
+
codebook_size: 8192
|
| 108 |
+
temporal_reduction: 4
|
| 109 |
+
mask_prob: 0.01
|
| 110 |
+
mask_length: 40
|
| 111 |
+
unmasked_region_weight: 0
|
| 112 |
+
apply_l2_normalization: true
|
| 113 |
+
codebook_and_matrix_init_file: data/local/codebook_and_matrix_seed20220404.pth
|
| 114 |
+
frame_chunk_size: 3200
|
| 115 |
+
use_preprocessor: true
|
| 116 |
+
token_type: null
|
| 117 |
+
cleaner: null
|
| 118 |
+
speech_volume_normalize: null
|
| 119 |
+
rir_scp: null
|
| 120 |
+
rir_apply_prob: 1.0
|
| 121 |
+
noise_scp: null
|
| 122 |
+
noise_apply_prob: 1.0
|
| 123 |
+
noise_db_range: '13_15'
|
| 124 |
+
frontend: default
|
| 125 |
+
frontend_conf:
|
| 126 |
+
fs: 16k
|
| 127 |
+
n_fft: 512
|
| 128 |
+
win_length: 400
|
| 129 |
+
hop_length: 160
|
| 130 |
+
frontend_conf: null
|
| 131 |
+
apply_stft: true
|
| 132 |
+
specaug: null
|
| 133 |
+
specaug_conf: {}
|
| 134 |
+
normalize: global_mvn
|
| 135 |
+
normalize_conf:
|
| 136 |
+
stats_file: exp/bestrq_stats_raw_en/train/feats_stats.npz
|
| 137 |
+
preencoder: null
|
| 138 |
+
preencoder_conf: {}
|
| 139 |
+
encoder: conformer
|
| 140 |
+
encoder_conf:
|
| 141 |
+
output_size: 512
|
| 142 |
+
attention_heads: 8
|
| 143 |
+
linear_units: 2048
|
| 144 |
+
num_blocks: 17
|
| 145 |
+
dropout_rate: 0.1
|
| 146 |
+
positional_dropout_rate: 0.1
|
| 147 |
+
attention_dropout_rate: 0.1
|
| 148 |
+
input_layer: conv2d
|
| 149 |
+
normalize_before: true
|
| 150 |
+
macaron_style: true
|
| 151 |
+
rel_pos_type: latest
|
| 152 |
+
pos_enc_layer_type: rel_pos
|
| 153 |
+
selfattention_layer_type: rel_selfattn
|
| 154 |
+
activation_type: swish
|
| 155 |
+
use_cnn_module: true
|
| 156 |
+
cnn_module_kernel: 31
|
| 157 |
+
postencoder: null
|
| 158 |
+
postencoder_conf: {}
|
| 159 |
+
required:
|
| 160 |
+
- output_dir
|
| 161 |
+
version: 0.10.7a1
|
| 162 |
+
distributed: true
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/backward_time.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/forward_time.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/gpu_max_cached_mem_GB.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/iter_time.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/label_coverage.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/loss.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_acc.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/masked_loss.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim0_lr0.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/optim_step_time.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/prediction_coverage.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/train_time.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_acc.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/images/unmasked_loss.png
ADDED
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
9epoch.pth
|
exp/bestrq_train_bestrq_conformerL_maskprob1e-2_unmaskedonly_l2norm_cb8192_accum8_bs256_amp_lr1e-4_seed20220404_chunk3k_raw_en/valid.masked_acc.best.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
9epoch.pth
|