Divyasreepat committed on
Commit
ac5ce2f
1 Parent(s): 4fa7138

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: keras-hub
3
+ ---
4
+ This is a [`Whisper` model](https://keras.io/api/keras_hub/models/whisper) uploaded using the KerasHub library. It can be used with the JAX, TensorFlow, and PyTorch backends.
5
+ Model config:
6
+ * **name:** whisper_backbone
7
+ * **trainable:** True
8
+ * **vocabulary_size:** 51865
9
+ * **num_layers:** 24
10
+ * **num_heads:** 16
11
+ * **hidden_dim:** 1024
12
+ * **intermediate_dim:** 4096
13
+ * **num_mels:** 80
14
+ * **dropout:** 0.0
15
+ * **max_encoder_sequence_length:** 3000
16
+ * **max_decoder_sequence_length:** 448
17
+
18
+ This model card has been generated automatically and should be completed by the model author. See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for more information.
assets/tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
assets/tokenizer/vocabulary.json ADDED
The diff for this file is too large to render. See raw diff
 
audio_converter.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.whisper.whisper_audio_converter",
3
+ "class_name": "WhisperAudioConverter",
4
+ "config": {
5
+ "name": "whisper_audio_converter",
6
+ "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "float32"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "num_mels": 80,
16
+ "num_fft_bins": 400,
17
+ "stride": 160,
18
+ "sampling_rate": 16000,
19
+ "max_audio_length": 30
20
+ },
21
+ "registered_name": "keras_nlp>WhisperAudioConverter"
22
+ }
config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.whisper.whisper_backbone",
3
+ "class_name": "WhisperBackbone",
4
+ "config": {
5
+ "name": "whisper_backbone",
6
+ "trainable": true,
7
+ "vocabulary_size": 51865,
8
+ "num_layers": 24,
9
+ "num_heads": 16,
10
+ "hidden_dim": 1024,
11
+ "intermediate_dim": 4096,
12
+ "num_mels": 80,
13
+ "dropout": 0.0,
14
+ "max_encoder_sequence_length": 3000,
15
+ "max_decoder_sequence_length": 448
16
+ },
17
+ "registered_name": "keras_nlp>WhisperBackbone",
18
+ "assets": [],
19
+ "weights": "model.weights.h5"
20
+ }
metadata.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "keras_version": "3.0.1",
3
+ "keras_nlp_version": "0.7.0",
4
+ "parameter_count": 763857920,
5
+ "date_saved": "2023-12-27@02:35:18"
6
+ }
model.weights.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15760ed855fc6db212109b18447bfcc686a62cff3cd742c6127dcb09318b2b8c
3
+ size 3057470592
tokenizer.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.whisper.whisper_tokenizer",
3
+ "class_name": "WhisperTokenizer",
4
+ "config": {
5
+ "name": "whisper_tokenizer",
6
+ "trainable": true,
7
+ "dtype": "int32",
8
+ "sequence_length": null,
9
+ "add_prefix_space": false,
10
+ "special_tokens": {
11
+ "<|startoftranscript|>": 50258,
12
+ "<|endoftext|>": 50257,
13
+ "<|notimestamps|>": 50363,
14
+ "<|translate|>": 50359,
15
+ "<|transcribe|>": 50358
16
+ },
17
+ "language_tokens": {
18
+ "<|af|>": 50327,
19
+ "<|am|>": 50334,
20
+ "<|ar|>": 50272,
21
+ "<|as|>": 50350,
22
+ "<|az|>": 50304,
23
+ "<|ba|>": 50355,
24
+ "<|be|>": 50330,
25
+ "<|bg|>": 50292,
26
+ "<|bn|>": 50302,
27
+ "<|bo|>": 50347,
28
+ "<|br|>": 50309,
29
+ "<|bs|>": 50315,
30
+ "<|ca|>": 50270,
31
+ "<|cs|>": 50283,
32
+ "<|cy|>": 50297,
33
+ "<|da|>": 50285,
34
+ "<|de|>": 50261,
35
+ "<|el|>": 50281,
36
+ "<|en|>": 50259,
37
+ "<|es|>": 50262,
38
+ "<|et|>": 50307,
39
+ "<|eu|>": 50310,
40
+ "<|fa|>": 50300,
41
+ "<|fi|>": 50277,
42
+ "<|fo|>": 50338,
43
+ "<|fr|>": 50265,
44
+ "<|gl|>": 50319,
45
+ "<|gu|>": 50333,
46
+ "<|haw|>": 50352,
47
+ "<|ha|>": 50354,
48
+ "<|he|>": 50279,
49
+ "<|hi|>": 50276,
50
+ "<|hr|>": 50291,
51
+ "<|ht|>": 50339,
52
+ "<|hu|>": 50286,
53
+ "<|hy|>": 50312,
54
+ "<|id|>": 50275,
55
+ "<|is|>": 50311,
56
+ "<|it|>": 50274,
57
+ "<|ja|>": 50266,
58
+ "<|jw|>": 50356,
59
+ "<|ka|>": 50329,
60
+ "<|kk|>": 50316,
61
+ "<|km|>": 50323,
62
+ "<|kn|>": 50306,
63
+ "<|ko|>": 50264,
64
+ "<|la|>": 50294,
65
+ "<|lb|>": 50345,
66
+ "<|ln|>": 50353,
67
+ "<|lo|>": 50336,
68
+ "<|lt|>": 50293,
69
+ "<|lv|>": 50301,
70
+ "<|mg|>": 50349,
71
+ "<|mi|>": 50295,
72
+ "<|mk|>": 50308,
73
+ "<|ml|>": 50296,
74
+ "<|mn|>": 50314,
75
+ "<|mr|>": 50320,
76
+ "<|ms|>": 50282,
77
+ "<|mt|>": 50343,
78
+ "<|my|>": 50346,
79
+ "<|ne|>": 50313,
80
+ "<|nl|>": 50271,
81
+ "<|nn|>": 50342,
82
+ "<|no|>": 50288,
83
+ "<|oc|>": 50328,
84
+ "<|pa|>": 50321,
85
+ "<|pl|>": 50269,
86
+ "<|ps|>": 50340,
87
+ "<|pt|>": 50267,
88
+ "<|ro|>": 50284,
89
+ "<|ru|>": 50263,
90
+ "<|sa|>": 50344,
91
+ "<|sd|>": 50332,
92
+ "<|si|>": 50322,
93
+ "<|sk|>": 50298,
94
+ "<|sl|>": 50305,
95
+ "<|sn|>": 50324,
96
+ "<|so|>": 50326,
97
+ "<|sq|>": 50317,
98
+ "<|sr|>": 50303,
99
+ "<|su|>": 50357,
100
+ "<|sv|>": 50273,
101
+ "<|sw|>": 50318,
102
+ "<|ta|>": 50287,
103
+ "<|te|>": 50299,
104
+ "<|tg|>": 50331,
105
+ "<|th|>": 50289,
106
+ "<|tk|>": 50341,
107
+ "<|tl|>": 50348,
108
+ "<|tr|>": 50268,
109
+ "<|tt|>": 50351,
110
+ "<|uk|>": 50280,
111
+ "<|ur|>": 50290,
112
+ "<|uz|>": 50337,
113
+ "<|vi|>": 50278,
114
+ "<|yi|>": 50335,
115
+ "<|yo|>": 50325,
116
+ "<|zh|>": 50260
117
+ }
118
+ },
119
+ "registered_name": "keras_nlp>WhisperTokenizer",
120
+ "assets": [
121
+ "assets/tokenizer/merges.txt",
122
+ "assets/tokenizer/vocabulary.json"
123
+ ],
124
+ "weights": null
125
+ }