justheuristic committed on
Commit
9159e0b
1 Parent(s): c10cdb6

push-o-matic

Browse files
Files changed (3) hide show
  1. config.json +6 -3
  2. pytorch_model.bin +1 -1
  3. tokenizer_config.json +1 -1
config.json CHANGED
@@ -1,5 +1,8 @@
1
  {
2
  "apply_residual_connection_post_layernorm": false,
 
 
 
3
  "attention_dropout": 0.0,
4
  "attention_softmax_in_fp32": true,
5
  "bias_dropout_fusion": true,
@@ -7,14 +10,14 @@
7
  "dht_prefix": "bigscience/test-bloomd-6b3",
8
  "eos_token_id": 2,
9
  "hidden_dropout": 0.0,
 
10
  "initializer_range": 0.02,
11
  "layer_norm_epsilon": 1e-05,
12
  "masked_softmax_fusion": true,
13
  "model_type": "bloom",
14
- "n_embed": 4096,
15
  "n_inner": null,
16
  "n_layer": 30,
17
- "num_attention_heads": 32,
18
  "offset_alibi": 100,
19
  "pad_token_id": 3,
20
  "pretraining_tp": 4,
@@ -24,6 +27,6 @@
24
  "slow_but_exact": false,
25
  "transformers_version": "4.21.0.dev0",
26
  "unk_token_id": 0,
27
- "use_cache": false,
28
  "vocab_size": 250880
29
  }
 
1
  {
2
  "apply_residual_connection_post_layernorm": false,
3
+ "architectures": [
4
+ "BloomModel"
5
+ ],
6
  "attention_dropout": 0.0,
7
  "attention_softmax_in_fp32": true,
8
  "bias_dropout_fusion": true,
 
10
  "dht_prefix": "bigscience/test-bloomd-6b3",
11
  "eos_token_id": 2,
12
  "hidden_dropout": 0.0,
13
+ "hidden_size": 4096,
14
  "initializer_range": 0.02,
15
  "layer_norm_epsilon": 1e-05,
16
  "masked_softmax_fusion": true,
17
  "model_type": "bloom",
18
+ "n_head": 32,
19
  "n_inner": null,
20
  "n_layer": 30,
 
21
  "offset_alibi": 100,
22
  "pad_token_id": 3,
23
  "pretraining_tp": 4,
 
27
  "slow_but_exact": false,
28
  "transformers_version": "4.21.0.dev0",
29
  "unk_token_id": 0,
30
+ "use_cache": true,
31
  "vocab_size": 250880
32
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a16a76ab0ef60497ad99fe7c5f6e76f455b1dae5d08fadeaebc849d14d1f5093
3
  size 2055243291
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50f206263e7636fc72a42747e86c39d576f3b6790f209132bdb8b03fa0660fb7
3
  size 2055243291
tokenizer_config.json CHANGED
@@ -2,9 +2,9 @@
2
  "add_prefix_space": false,
3
  "bos_token": "<s>",
4
  "eos_token": "</s>",
5
- "model_max_length": 1024,
6
  "name_or_path": "bigscience/bloom-6b3",
7
  "pad_token": "<pad>",
 
8
  "special_tokens_map_file": null,
9
  "tokenizer_class": "BloomTokenizer",
10
  "unk_token": "<unk>"
 
2
  "add_prefix_space": false,
3
  "bos_token": "<s>",
4
  "eos_token": "</s>",
 
5
  "name_or_path": "bigscience/bloom-6b3",
6
  "pad_token": "<pad>",
7
+ "padding_side": "left",
8
  "special_tokens_map_file": null,
9
  "tokenizer_class": "BloomTokenizer",
10
  "unk_token": "<unk>"