woodwardmw committed on
Commit
fac7291
·
verified ·
1 Parent(s): b29ad71

Training in progress, step 500

Browse files
added_tokens.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "</s>": 73,
3
- "<s>": 72
4
  }
 
1
  {
2
+ "</s>": 76,
3
+ "<s>": 75
4
  }
config.json CHANGED
@@ -9,7 +9,7 @@
9
  "architectures": [
10
  "Wav2Vec2BertForCTC"
11
  ],
12
- "attention_dropout": 0.0,
13
  "blank_token_id": 0,
14
  "bos_token_id": 1,
15
  "classifier_proj_size": 768,
@@ -26,7 +26,7 @@
26
  "feature_projection_input_dim": 160,
27
  "final_dropout": 0.1,
28
  "hidden_act": "swish",
29
- "hidden_dropout": 0.0,
30
  "hidden_size": 1024,
31
  "initializer_range": 0.02,
32
  "intermediate_size": 4096,
@@ -48,7 +48,7 @@
48
  "num_hidden_layers": 24,
49
  "num_negatives": 100,
50
  "output_hidden_size": 1024,
51
- "pad_token_id": 68,
52
  "position_embeddings_type": "relative_key",
53
  "proj_codevector_dim": 768,
54
  "right_max_position_embeddings": 8,
@@ -78,6 +78,6 @@
78
  "transformers_version": "4.49.0",
79
  "use_intermediate_ffn_before_adapter": false,
80
  "use_weighted_layer_sum": false,
81
- "vocab_size": 74,
82
  "xvector_output_dim": 512
83
  }
 
9
  "architectures": [
10
  "Wav2Vec2BertForCTC"
11
  ],
12
+ "attention_dropout": 0.1,
13
  "blank_token_id": 0,
14
  "bos_token_id": 1,
15
  "classifier_proj_size": 768,
 
26
  "feature_projection_input_dim": 160,
27
  "final_dropout": 0.1,
28
  "hidden_act": "swish",
29
+ "hidden_dropout": 0.1,
30
  "hidden_size": 1024,
31
  "initializer_range": 0.02,
32
  "intermediate_size": 4096,
 
48
  "num_hidden_layers": 24,
49
  "num_negatives": 100,
50
  "output_hidden_size": 1024,
51
+ "pad_token_id": 71,
52
  "position_embeddings_type": "relative_key",
53
  "proj_codevector_dim": 768,
54
  "right_max_position_embeddings": 8,
 
78
  "transformers_version": "4.49.0",
79
  "use_intermediate_ffn_before_adapter": false,
80
  "use_weighted_layer_sum": false,
81
+ "vocab_size": 77,
82
  "xvector_output_dim": 512
83
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de6262a0e09af1c4f8de3b03b21577cf8b37ab964d5951862b84fa2cc52c9f42
3
- size 2322378112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f861f5ef22b98759dbd153a1f06f9dc819cce350e445c0354823b68fec3a968f
3
+ size 2322390412
tokenizer_config.json CHANGED
@@ -24,7 +24,7 @@
24
  "single_word": false,
25
  "special": false
26
  },
27
- "68": {
28
  "content": "[PAD]",
29
  "lstrip": true,
30
  "normalized": false,
@@ -32,7 +32,7 @@
32
  "single_word": false,
33
  "special": false
34
  },
35
- "69": {
36
  "content": "[UNK]",
37
  "lstrip": true,
38
  "normalized": false,
@@ -40,7 +40,7 @@
40
  "single_word": false,
41
  "special": false
42
  },
43
- "72": {
44
  "content": "<s>",
45
  "lstrip": false,
46
  "normalized": false,
@@ -48,7 +48,7 @@
48
  "single_word": false,
49
  "special": true
50
  },
51
- "73": {
52
  "content": "</s>",
53
  "lstrip": false,
54
  "normalized": false,
 
24
  "single_word": false,
25
  "special": false
26
  },
27
+ "71": {
28
  "content": "[PAD]",
29
  "lstrip": true,
30
  "normalized": false,
 
32
  "single_word": false,
33
  "special": false
34
  },
35
+ "72": {
36
  "content": "[UNK]",
37
  "lstrip": true,
38
  "normalized": false,
 
40
  "single_word": false,
41
  "special": false
42
  },
43
+ "75": {
44
  "content": "<s>",
45
  "lstrip": false,
46
  "normalized": false,
 
48
  "single_word": false,
49
  "special": true
50
  },
51
+ "76": {
52
  "content": "</s>",
53
  "lstrip": false,
54
  "normalized": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f83e6c3efd60d97448ee0ad04f217955bbc10e33fc5a49005ee4cd09e9fb81a
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e8228845e62a44b76c6d252121dd5b91007f4f43129c6a5cc9b250bacfa2e91
3
  size 5368
vocab.json CHANGED
@@ -1,74 +1,77 @@
1
  {
2
- "(": 60,
3
- ")": 61,
4
- ",": 20,
5
  "-": 38,
6
  ".": 26,
7
- "7": 57,
8
- ":": 36,
9
- ";": 62,
10
- "<": 34,
11
  "<ctc_blank>": 0,
12
  "<pad>": 1,
13
  "<unk>": 2,
14
- ">": 35,
15
- "?": 49,
16
- "[PAD]": 68,
17
- "[UNK]": 69,
18
- "А": 27,
 
 
19
  "Б": 45,
 
20
  "Г": 39,
21
- "Д": 48,
22
- "Е": 55,
23
- "И": 63,
24
- "К": 41,
25
- "Л": 50,
 
26
  "М": 46,
27
- "Н": 58,
28
- "О": 53,
29
- "П": 64,
30
- "Р": 44,
31
- "С": 52,
32
  "Т": 47,
33
- "У": 59,
34
- "Х": 43,
35
- "Ц": 65,
36
- "Э": 66,
37
- "Ю": 67,
 
38
  "а": 4,
39
  "б": 17,
40
- "в": 25,
41
  "г": 11,
42
  "д": 23,
43
- "е": 8,
44
  "ж": 28,
45
  "з": 21,
46
  "и": 9,
47
- "й": 24,
48
  "к": 14,
49
- "л": 7,
50
- "м": 22,
51
  "н": 10,
52
  "о": 5,
53
- "п": 37,
54
  "р": 13,
55
  "с": 18,
56
- "т": 29,
57
- "у": 16,
58
- "ф": 56,
59
- "х": 15,
60
  "ц": 31,
61
  "ч": 32,
62
- "ш": 33,
63
- "щ": 51,
64
  "ъ": 6,
65
  "ь": 12,
66
  "э": 30,
67
- "ю": 54,
68
- "я": 40,
69
- "ё": 42,
70
- "Ӏ": 19,
71
- "‌": 70,
72
- "‍": 71,
 
73
  "▁": 3
74
  }
 
1
  {
2
+ "!": 67,
3
+ ",": 19,
 
4
  "-": 38,
5
  ".": 26,
6
+ ":": 33,
7
+ "<": 36,
 
 
8
  "<ctc_blank>": 0,
9
  "<pad>": 1,
10
  "<unk>": 2,
11
+ ">": 37,
12
+ "?": 53,
13
+ "[PAD]": 71,
14
+ "[UNK]": 72,
15
+ "«": 54,
16
+ "»": 55,
17
+ "А": 29,
18
  "Б": 45,
19
+ "В": 63,
20
  "Г": 39,
21
+ "Д": 44,
22
+ "Е": 58,
23
+ "Ж": 68,
24
+ "И": 56,
25
+ "К": 40,
26
+ "Л": 59,
27
  "М": 46,
28
+ "Н": 49,
29
+ "О": 57,
30
+ "П": 69,
31
+ "Р": 43,
32
+ "С": 50,
33
  "Т": 47,
34
+ "У": 64,
35
+ "Ф": 65,
36
+ "Х": 51,
37
+ "Ц": 66,
38
+ "Э": 62,
39
+ "Ю": 70,
40
  "а": 4,
41
  "б": 17,
42
+ "в": 24,
43
  "г": 11,
44
  "д": 23,
45
+ "е": 7,
46
  "ж": 28,
47
  "з": 21,
48
  "и": 9,
49
+ "й": 25,
50
  "к": 14,
51
+ "л": 8,
52
+ "м": 20,
53
  "н": 10,
54
  "о": 5,
55
+ "п": 42,
56
  "р": 13,
57
  "с": 18,
58
+ "т": 27,
59
+ "у": 15,
60
+ "ф": 48,
61
+ "х": 16,
62
  "ц": 31,
63
  "ч": 32,
64
+ "ш": 34,
65
+ "щ": 60,
66
  "ъ": 6,
67
  "ь": 12,
68
  "э": 30,
69
+ "ю": 52,
70
+ "я": 35,
71
+ "ё": 41,
72
+ "Ӏ": 22,
73
+ "‌": 73,
74
+ "‍": 74,
75
+ "–": 61,
76
  "▁": 3
77
  }