Beijuka committed on
Commit
b0422c9
1 Parent(s): fc5b7e2

Training in progress, epoch 1

Browse files
Files changed (3) hide show
  1. config.json +3 -1
  2. model.safetensors +2 -2
  3. training_args.bin +2 -2
config.json CHANGED
@@ -1,7 +1,8 @@
1
  {
2
  "_name_or_path": "roberta-base",
 
3
  "architectures": [
4
- "RobertaForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
@@ -12,6 +13,7 @@
12
  "hidden_size": 768,
13
  "initializer_range": 0.02,
14
  "intermediate_size": 3072,
 
15
  "layer_norm_eps": 1e-05,
16
  "max_position_embeddings": 514,
17
  "model_type": "roberta",
 
1
  {
2
  "_name_or_path": "roberta-base",
3
+ "add_cross_attention": true,
4
  "architectures": [
5
+ "RobertaForCausalLM"
6
  ],
7
  "attention_probs_dropout_prob": 0.1,
8
  "bos_token_id": 0,
 
13
  "hidden_size": 768,
14
  "initializer_range": 0.02,
15
  "intermediate_size": 3072,
16
+ "is_decoder": true,
17
  "layer_norm_eps": 1e-05,
18
  "max_position_embeddings": 514,
19
  "model_type": "roberta",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00869a6539e9651d25afa1675e5d71a3d17d4fe1d653c4080bb02b7e579db7ea
3
- size 498813948
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7d15dc981775834b8377397e85ed059db46951d06908a4b7ce7d5c9fb4da792
3
+ size 612296700
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3fe5b8247adb61730fe65c50089e9709888575bde282883ba5246a21215c1da
3
- size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57d922e814de1afdf2200038bc23105dc7c702109259328586e84d6b898984c6
3
+ size 5304