hynt committed on
Commit
9dca845
·
verified ·
1 Parent(s): 17cd23d

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +98 -0
config.json ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "Efficient Conformer CTC Small",
3
+ "model_type": "CTC",
4
+
5
+ "encoder_params":
6
+ {
7
+ "arch": "Conformer",
8
+ "num_blocks": 15,
9
+ "dim_model": [120, 168, 240],
10
+ "ff_ratio": 4,
11
+ "num_heads": 4,
12
+ "kernel_size": 15,
13
+ "Pdrop": 0.1,
14
+ "conv_stride": 2,
15
+ "att_stride": 1,
16
+ "strided_blocks": [4, 9],
17
+ "expand_blocks": [4, 9],
18
+ "att_group_size": [3, 1, 1],
19
+
20
+ "relative_pos_enc": true,
21
+ "max_pos_encoding": 10000,
22
+
23
+ "subsampling_module": "Conv2d",
24
+ "subsampling_layers": 1,
25
+ "subsampling_filters": [120],
26
+ "subsampling_kernel_size": 3,
27
+ "subsampling_norm": "batch",
28
+ "subsampling_act": "swish",
29
+
30
+ "sample_rate": 16000,
31
+ "win_length_ms": 25,
32
+ "hop_length_ms": 10,
33
+ "n_fft": 512,
34
+ "n_mels": 80,
35
+ "normalize": false,
36
+ "mean": -5.6501,
37
+ "std": 4.2280,
38
+
39
+ "spec_augment": false,
40
+ "mF": 2,
41
+ "F": 27,
42
+ "mT": 5,
43
+ "pS": 0.05
44
+ },
45
+
46
+ "tokenizer_params":
47
+ {
48
+ "tokenizer_path": "datasets/Vietnamese/vi_bpe_1024.model",
49
+ "vocab_type": "bpe",
50
+ "vocab_size": 1024
51
+ },
52
+
53
+ "training_params":
54
+ {
55
+ "epochs": 450,
56
+ "batch_size": 64,
57
+ "accumulated_steps": 2,
58
+ "mixed_precision": true,
59
+
60
+ "optimizer": "Adam",
61
+ "beta1": 0.9,
62
+ "beta2": 0.98,
63
+ "eps": 1e-9,
64
+ "weight_decay": 1e-6,
65
+
66
+ "lr_schedule": "Transformer",
67
+ "schedule_dim": 240,
68
+ "warmup_steps": 10000,
69
+ "K": 2,
70
+
71
+ "train_audio_max_length": 256000,
72
+ "train_label_max_length": 256000,
73
+ "eval_audio_max_length": 256000,
74
+ "eval_label_max_length": 256000,
75
+
76
+ "training_dataset": "Vietnamese",
77
+ "training_dataset_path": "/mnt/c/Users/hyngu/Data/ASRDataset/",
78
+
79
+ "evaluation_dataset": "Vietnamese",
80
+ "evaluation_dataset_path": "/mnt/c/Users/hyngu/Data/ASRDataset/",
81
+
82
+ "callback_path": "callbacks/EfficientConformerCTCSmall/"
83
+ },
84
+
85
+ "decoding_params":
86
+ {
87
+ "beam_size": 5,
88
+ "tmp": 1,
89
+
90
+ "ngram_path": "data/6gram_lm_corpus.binary",
91
+ "ngram_alpha": 0.4,
92
+ "ngram_beta": 1.0,
93
+
94
+ "lm_config": "configs/LM-Transformer.json",
95
+ "lm_weight": 1,
96
+ "lm_tmp": 1
97
+ }
98
+ }