robinhad committed on
Commit
f0b1d25
1 Parent(s): 03b37d7

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.json +29 -7
  2. vocab.json +1 -1
config.json CHANGED
@@ -8,7 +8,7 @@
8
  "architectures": [
9
  "Wav2Vec2ForCTC"
10
  ],
11
- "attention_dropout": 0.0,
12
  "bos_token_id": 1,
13
  "classifier_proj_size": 256,
14
  "codevector_dim": 768,
@@ -49,17 +49,17 @@
49
  "feat_extract_activation": "gelu",
50
  "feat_extract_dropout": 0.0,
51
  "feat_extract_norm": "layer",
52
- "feat_proj_dropout": 0.0,
53
  "feat_quantizer_dropout": 0.0,
54
  "final_dropout": 0.0,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
- "hidden_dropout": 0.0,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
- "layerdrop": 0.0,
63
  "mask_feature_length": 10,
64
  "mask_feature_min_masks": 0,
65
  "mask_feature_prob": 0.0,
@@ -77,10 +77,32 @@
77
  "num_hidden_layers": 24,
78
  "num_negatives": 100,
79
  "output_hidden_size": 1024,
80
- "pad_token_id": 35,
81
  "proj_codevector_dim": 768,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
82
  "torch_dtype": "float32",
83
- "transformers_version": "4.14.1",
84
  "use_weighted_layer_sum": false,
85
- "vocab_size": 38
 
86
  }
 
8
  "architectures": [
9
  "Wav2Vec2ForCTC"
10
  ],
11
+ "attention_dropout": 0.1,
12
  "bos_token_id": 1,
13
  "classifier_proj_size": 256,
14
  "codevector_dim": 768,
 
49
  "feat_extract_activation": "gelu",
50
  "feat_extract_dropout": 0.0,
51
  "feat_extract_norm": "layer",
52
+ "feat_proj_dropout": 0.1,
53
  "feat_quantizer_dropout": 0.0,
54
  "final_dropout": 0.0,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
+ "hidden_dropout": 0.1,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.1,
63
  "mask_feature_length": 10,
64
  "mask_feature_min_masks": 0,
65
  "mask_feature_prob": 0.0,
 
77
  "num_hidden_layers": 24,
78
  "num_negatives": 100,
79
  "output_hidden_size": 1024,
80
+ "pad_token_id": 36,
81
  "proj_codevector_dim": 768,
82
+ "tdnn_dilation": [
83
+ 1,
84
+ 2,
85
+ 3,
86
+ 1,
87
+ 1
88
+ ],
89
+ "tdnn_dim": [
90
+ 512,
91
+ 512,
92
+ 512,
93
+ 512,
94
+ 1500
95
+ ],
96
+ "tdnn_kernel": [
97
+ 5,
98
+ 3,
99
+ 3,
100
+ 1,
101
+ 1
102
+ ],
103
  "torch_dtype": "float32",
104
+ "transformers_version": "4.25.1",
105
  "use_weighted_layer_sum": false,
106
+ "vocab_size": 39,
107
+ "xvector_output_dim": 512
108
  }
vocab.json CHANGED
@@ -1 +1 @@
1
- {"а": 1, "б": 2, "в": 3, "г": 4, "д": 5, "е": 6, "ж": 7, "з": 8, "и": 9, "й": 10, "к": 11, "л": 12, "м": 13, "н": 14, "о": 15, "п": 16, "р": 17, "с": 18, "т": 19, "у": 20, "ф": 21, "х": 22, "ц": 23, "ч": 24, "ш": 25, "щ": 26, "ь": 27, "ю": 28, "я": 29, "є": 30, "і": 31, "ї": 32, "ґ": 33, "|": 0, "[UNK]": 34, "[PAD]": 35}
 
1
+ {"'": 1, "\u0430": 2, "\u0431": 3, "\u0432": 4, "\u0433": 5, "\u0434": 6, "\u0435": 7, "\u0436": 8, "\u0437": 9, "\u0438": 10, "\u0439": 11, "\u043a": 12, "\u043b": 13, "\u043c": 14, "\u043d": 15, "\u043e": 16, "\u043f": 17, "\u0440": 18, "\u0441": 19, "\u0442": 20, "\u0443": 21, "\u0444": 22, "\u0445": 23, "\u0446": 24, "\u0447": 25, "\u0448": 26, "\u0449": 27, "\u044c": 28, "\u044e": 29, "\u044f": 30, "\u0454": 31, "\u0456": 32, "\u0457": 33, "\u0491": 34, "|": 0, "[UNK]": 35, "[PAD]": 36}