8688chris committed on
Commit
1a80618
·
verified ·
1 Parent(s): 9d2a756

Model save

Browse files
README.md ADDED
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: apache-2.0
4
+ base_model: facebook/wav2vec2-base-960h
5
+ tags:
6
+ - generated_from_trainer
7
+ metrics:
8
+ - wer
9
+ model-index:
10
+ - name: helldivers2-jarvis-asrV8
11
+ results: []
12
+ ---
13
+
14
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
+ should probably proofread and complete it, then remove this comment. -->
16
+
17
+ # helldivers2-jarvis-asrV8
18
+
19
+ This model is a fine-tuned version of [facebook/wav2vec2-base-960h](https://huggingface.co/facebook/wav2vec2-base-960h) on an unknown dataset.
20
+ It achieves the following results on the evaluation set (final checkpoint, epoch 70, step 5110):
21
+ - Loss: 19.1922
22
+ - Wer: 0.1770
23
+ - Cer: 0.7950
24
+
25
+ ## Model description
26
+
27
+ More information needed
28
+
29
+ ## Intended uses & limitations
30
+
31
+ More information needed
32
+
33
+ ## Training and evaluation data
34
+
35
+ More information needed
36
+
37
+ ## Training procedure
38
+
39
+ ### Training hyperparameters
40
+
41
+ The following hyperparameters were used during training:
42
+ - learning_rate: 1e-05
43
+ - train_batch_size: 15
44
+ - eval_batch_size: 15
45
+ - seed: 42
46
+ - optimizer: OptimizerNames.ADAMW_TORCH (AdamW) with betas=(0.9,0.999) and epsilon=1e-08; no additional optimizer arguments
47
+ - lr_scheduler_type: linear
48
+ - lr_scheduler_warmup_steps: 50
49
+ - num_epochs: 70
50
+
51
+ ### Training results
52
+
53
+ | Training Loss | Epoch | Step | Validation Loss | Wer | Cer |
54
+ |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|
55
+ | 585.4988 | 1.0 | 73 | 271.5495 | 0.3633 | 0.8109 |
56
+ | 378.3453 | 2.0 | 146 | 168.1931 | 0.3276 | 0.8056 |
57
+ | 319.9564 | 3.0 | 219 | 140.2753 | 0.3131 | 0.8034 |
58
+ | 281.8407 | 4.0 | 292 | 127.9118 | 0.2933 | 0.8023 |
59
+ | 264.2254 | 5.0 | 365 | 103.9656 | 0.2814 | 0.8020 |
60
+ | 233.3232 | 6.0 | 438 | 87.8603 | 0.2655 | 0.8005 |
61
+ | 213.0622 | 7.0 | 511 | 80.5251 | 0.2497 | 0.7993 |
62
+ | 194.7588 | 8.0 | 584 | 77.2796 | 0.2457 | 0.7991 |
63
+ | 197.9257 | 9.0 | 657 | 72.9397 | 0.2378 | 0.7985 |
64
+ | 183.4031 | 10.0 | 730 | 57.6201 | 0.2312 | 0.7979 |
65
+ | 172.3133 | 11.0 | 803 | 56.8209 | 0.2219 | 0.7976 |
66
+ | 165.2571 | 12.0 | 876 | 52.5103 | 0.2219 | 0.7972 |
67
+ | 161.9286 | 13.0 | 949 | 50.8869 | 0.2180 | 0.7970 |
68
+ | 158.4977 | 14.0 | 1022 | 46.2574 | 0.2127 | 0.7969 |
69
+ | 146.6963 | 15.0 | 1095 | 39.4797 | 0.2114 | 0.7968 |
70
+ | 131.5992 | 16.0 | 1168 | 38.5002 | 0.2127 | 0.7966 |
71
+ | 136.5205 | 17.0 | 1241 | 34.6582 | 0.2100 | 0.7965 |
72
+ | 130.8528 | 18.0 | 1314 | 31.8192 | 0.2061 | 0.7964 |
73
+ | 122.9594 | 19.0 | 1387 | 31.4980 | 0.1968 | 0.7961 |
74
+ | 122.6427 | 20.0 | 1460 | 29.6717 | 0.1955 | 0.7961 |
75
+ | 116.4709 | 21.0 | 1533 | 30.8555 | 0.1955 | 0.7960 |
76
+ | 124.5335 | 22.0 | 1606 | 31.9685 | 0.1942 | 0.7959 |
77
+ | 110.134 | 23.0 | 1679 | 32.0465 | 0.1968 | 0.7963 |
78
+ | 105.5423 | 24.0 | 1752 | 30.3238 | 0.1955 | 0.7961 |
79
+ | 113.3944 | 25.0 | 1825 | 28.7380 | 0.1889 | 0.7959 |
80
+ | 112.8572 | 26.0 | 1898 | 25.8070 | 0.1876 | 0.7957 |
81
+ | 106.1037 | 27.0 | 1971 | 28.3786 | 0.1876 | 0.7957 |
82
+ | 105.8874 | 28.0 | 2044 | 27.5647 | 0.1889 | 0.7957 |
83
+ | 96.3391 | 29.0 | 2117 | 29.5317 | 0.1915 | 0.7958 |
84
+ | 103.2364 | 30.0 | 2190 | 26.4454 | 0.1836 | 0.7956 |
85
+ | 101.3744 | 31.0 | 2263 | 24.9761 | 0.1836 | 0.7955 |
86
+ | 94.1529 | 32.0 | 2336 | 25.9349 | 0.1810 | 0.7954 |
87
+ | 89.4031 | 33.0 | 2409 | 18.5316 | 0.1810 | 0.7954 |
88
+ | 98.6291 | 34.0 | 2482 | 26.2887 | 0.1810 | 0.7954 |
89
+ | 88.7591 | 35.0 | 2555 | 26.2593 | 0.1823 | 0.7954 |
90
+ | 91.8604 | 36.0 | 2628 | 27.2263 | 0.1823 | 0.7954 |
91
+ | 83.4981 | 37.0 | 2701 | 26.0174 | 0.1810 | 0.7954 |
92
+ | 88.0891 | 38.0 | 2774 | 26.2153 | 0.1823 | 0.7955 |
93
+ | 85.7155 | 39.0 | 2847 | 24.1102 | 0.1810 | 0.7954 |
94
+ | 87.0231 | 40.0 | 2920 | 25.7208 | 0.1836 | 0.7955 |
95
+ | 85.2278 | 41.0 | 2993 | 25.6799 | 0.1797 | 0.7952 |
96
+ | 83.8083 | 42.0 | 3066 | 25.9679 | 0.1810 | 0.7955 |
97
+ | 83.1864 | 43.0 | 3139 | 23.0670 | 0.1797 | 0.7953 |
98
+ | 92.3624 | 44.0 | 3212 | 23.0629 | 0.1797 | 0.7953 |
99
+ | 101.0567 | 45.0 | 3285 | 23.7475 | 0.1823 | 0.7955 |
100
+ | 77.1269 | 46.0 | 3358 | 21.2927 | 0.1836 | 0.7954 |
101
+ | 79.782 | 47.0 | 3431 | 22.2427 | 0.1797 | 0.7952 |
102
+ | 79.0065 | 48.0 | 3504 | 22.0512 | 0.1783 | 0.7952 |
103
+ | 78.0512 | 49.0 | 3577 | 22.9018 | 0.1770 | 0.7950 |
104
+ | 84.4353 | 50.0 | 3650 | 23.3538 | 0.1783 | 0.7952 |
105
+ | 76.3221 | 51.0 | 3723 | 21.3755 | 0.1823 | 0.7952 |
106
+ | 74.6622 | 52.0 | 3796 | 22.8240 | 0.1783 | 0.7951 |
107
+ | 82.2913 | 53.0 | 3869 | 21.2273 | 0.1770 | 0.7950 |
108
+ | 71.0879 | 54.0 | 3942 | 20.8637 | 0.1770 | 0.7950 |
109
+ | 78.6892 | 55.0 | 4015 | 22.2313 | 0.1770 | 0.7951 |
110
+ | 68.3446 | 56.0 | 4088 | 20.8211 | 0.1797 | 0.7952 |
111
+ | 78.6938 | 57.0 | 4161 | 21.4202 | 0.1783 | 0.7952 |
112
+ | 76.9933 | 58.0 | 4234 | 20.0210 | 0.1783 | 0.7951 |
113
+ | 70.8471 | 59.0 | 4307 | 22.2786 | 0.1783 | 0.7951 |
114
+ | 76.5866 | 60.0 | 4380 | 20.0782 | 0.1770 | 0.7951 |
115
+ | 69.9045 | 61.0 | 4453 | 21.1576 | 0.1797 | 0.7951 |
116
+ | 81.1508 | 62.0 | 4526 | 18.7841 | 0.1797 | 0.7951 |
117
+ | 82.9743 | 63.0 | 4599 | 18.4739 | 0.1823 | 0.7952 |
118
+ | 80.8333 | 64.0 | 4672 | 20.2582 | 0.1810 | 0.7954 |
119
+ | 71.9855 | 65.0 | 4745 | 21.3909 | 0.1770 | 0.7952 |
120
+ | 80.0273 | 66.0 | 4818 | 20.2303 | 0.1797 | 0.7952 |
121
+ | 74.9079 | 67.0 | 4891 | 19.8304 | 0.1783 | 0.7952 |
122
+ | 75.7448 | 68.0 | 4964 | 21.5770 | 0.1823 | 0.7954 |
123
+ | 71.0606 | 69.0 | 5037 | 20.9629 | 0.1797 | 0.7952 |
124
+ | 75.027 | 70.0 | 5110 | 19.1922 | 0.1770 | 0.7950 |
125
+
126
+
127
+ ### Framework versions
128
+
129
+ - Transformers 4.51.3
130
+ - Pytorch 2.5.1+cu121
131
+ - Datasets 3.6.0
132
+ - Tokenizers 0.21.1
config.json ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.1,
3
+ "adapter_attn_dim": null,
4
+ "adapter_kernel_size": 3,
5
+ "adapter_stride": 2,
6
+ "add_adapter": false,
7
+ "apply_spec_augment": true,
8
+ "architectures": [
9
+ "Wav2Vec2ForCTC"
10
+ ],
11
+ "attention_dropout": 0.1,
12
+ "bos_token_id": 1,
13
+ "classifier_proj_size": 256,
14
+ "codevector_dim": 256,
15
+ "contrastive_logits_temperature": 0.1,
16
+ "conv_bias": false,
17
+ "conv_dim": [
18
+ 512,
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512
25
+ ],
26
+ "conv_kernel": [
27
+ 10,
28
+ 3,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 2,
33
+ 2
34
+ ],
35
+ "conv_stride": [
36
+ 5,
37
+ 2,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2
43
+ ],
44
+ "ctc_loss_reduction": "sum",
45
+ "ctc_zero_infinity": false,
46
+ "diversity_loss_weight": 0.1,
47
+ "do_stable_layer_norm": false,
48
+ "eos_token_id": 2,
49
+ "feat_extract_activation": "gelu",
50
+ "feat_extract_dropout": 0.0,
51
+ "feat_extract_norm": "group",
52
+ "feat_proj_dropout": 0.1,
53
+ "feat_quantizer_dropout": 0.0,
54
+ "final_dropout": 0.1,
55
+ "gradient_checkpointing": false,
56
+ "hidden_act": "gelu",
57
+ "hidden_dropout": 0.1,
58
+ "hidden_dropout_prob": 0.1,
59
+ "hidden_size": 768,
60
+ "initializer_range": 0.02,
61
+ "intermediate_size": 3072,
62
+ "layer_norm_eps": 1e-05,
63
+ "layerdrop": 0.1,
64
+ "mask_feature_length": 10,
65
+ "mask_feature_min_masks": 0,
66
+ "mask_feature_prob": 0.0,
67
+ "mask_time_length": 10,
68
+ "mask_time_min_masks": 2,
69
+ "mask_time_prob": 0.05,
70
+ "model_type": "wav2vec2",
71
+ "num_adapter_layers": 3,
72
+ "num_attention_heads": 12,
73
+ "num_codevector_groups": 2,
74
+ "num_codevectors_per_group": 320,
75
+ "num_conv_pos_embedding_groups": 16,
76
+ "num_conv_pos_embeddings": 128,
77
+ "num_feat_extract_layers": 7,
78
+ "num_hidden_layers": 12,
79
+ "num_negatives": 100,
80
+ "output_hidden_size": 768,
81
+ "pad_token_id": 0,
82
+ "proj_codevector_dim": 256,
83
+ "tdnn_dilation": [
84
+ 1,
85
+ 2,
86
+ 3,
87
+ 1,
88
+ 1
89
+ ],
90
+ "tdnn_dim": [
91
+ 512,
92
+ 512,
93
+ 512,
94
+ 512,
95
+ 1500
96
+ ],
97
+ "tdnn_kernel": [
98
+ 5,
99
+ 3,
100
+ 3,
101
+ 1,
102
+ 1
103
+ ],
104
+ "torch_dtype": "float32",
105
+ "transformers_version": "4.51.3",
106
+ "use_weighted_layer_sum": false,
107
+ "vocab_size": 32,
108
+ "xvector_output_dim": 512
109
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6c8f9eb0424e21e1e0b070a1f387c23d2fcb0200a55045a4cf21fd484b20ae2
3
+ size 377611120
preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "processor_class": "Wav2Vec2Processor",
8
+ "return_attention_mask": false,
9
+ "sampling_rate": 16000
10
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "eos_token": "</s>",
4
+ "pad_token": "<pad>",
5
+ "unk_token": "<unk>"
6
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<pad>",
5
+ "lstrip": true,
6
+ "normalized": false,
7
+ "rstrip": true,
8
+ "single_word": false,
9
+ "special": false
10
+ },
11
+ "1": {
12
+ "content": "<s>",
13
+ "lstrip": true,
14
+ "normalized": false,
15
+ "rstrip": true,
16
+ "single_word": false,
17
+ "special": false
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": true,
22
+ "normalized": false,
23
+ "rstrip": true,
24
+ "single_word": false,
25
+ "special": false
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": true,
30
+ "normalized": false,
31
+ "rstrip": true,
32
+ "single_word": false,
33
+ "special": false
34
+ }
35
+ },
36
+ "bos_token": "<s>",
37
+ "clean_up_tokenization_spaces": false,
38
+ "do_lower_case": false,
39
+ "do_normalize": true,
40
+ "eos_token": "</s>",
41
+ "extra_special_tokens": {},
42
+ "model_max_length": 1000000000000000019884624838656,
43
+ "pad_token": "<pad>",
44
+ "processor_class": "Wav2Vec2Processor",
45
+ "replace_word_delimiter_char": " ",
46
+ "return_attention_mask": false,
47
+ "target_lang": null,
48
+ "tokenizer_class": "Wav2Vec2CTCTokenizer",
49
+ "unk_token": "<unk>",
50
+ "word_delimiter_token": "|"
51
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ac5335cb1225c0552e05b6d96fbe11cc7a9bf81d7ed80f23d7b7738760342e
3
+ size 5368
vocab.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "'": 27,
3
+ "</s>": 2,
4
+ "<pad>": 0,
5
+ "<s>": 1,
6
+ "<unk>": 3,
7
+ "A": 7,
8
+ "B": 24,
9
+ "C": 19,
10
+ "D": 14,
11
+ "E": 5,
12
+ "F": 20,
13
+ "G": 21,
14
+ "H": 11,
15
+ "I": 10,
16
+ "J": 29,
17
+ "K": 26,
18
+ "L": 15,
19
+ "M": 17,
20
+ "N": 9,
21
+ "O": 8,
22
+ "P": 23,
23
+ "Q": 30,
24
+ "R": 13,
25
+ "S": 12,
26
+ "T": 6,
27
+ "U": 16,
28
+ "V": 25,
29
+ "W": 18,
30
+ "X": 28,
31
+ "Y": 22,
32
+ "Z": 31,
33
+ "|": 4
34
+ }