End of training

Browse files

Files changed (6) hide show

.gitignore +1 -0
config.json +77 -0
pytorch_model.bin +3 -0
runs/Jul27_12-02-38_aaf4165f6dc0/1658923509.9307225/events.out.tfevents.1658923509.aaf4165f6dc0.91.1 +3 -0
runs/Jul27_12-02-38_aaf4165f6dc0/events.out.tfevents.1658923509.aaf4165f6dc0.91.0 +3 -0
training_args.bin +3 -0

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ checkpoint-*/

config.json ADDED Viewed

	@@ -0,0 +1,77 @@

+{
+  "_name_or_path": "robingeibel/reformer-big_patent-16384",
+  "architectures": [
+    "ReformerForMaskedLM"
+  ],
+  "attention_head_size": 64,
+  "attention_probs_dropout_prob": 0.1,
+  "attn_layers": [
+    "local",
+    "local",
+    "lsh",
+    "local",
+    "local",
+    "local",
+    "lsh",
+    "local",
+    "local",
+    "local",
+    "lsh",
+    "local"
+  ],
+  "axial_norm_std": 1.0,
+  "axial_pos_embds": false,
+  "axial_pos_embds_dim": [
+    128,
+    128
+  ],
+  "axial_pos_shape": [
+    512,
+    1024
+  ],
+  "chunk_size_lm_head": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "feed_forward_size": 1024,
+  "hash_seed": null,
+  "hidden_act": "relu",
+  "hidden_dropout_prob": 0.05,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "local_attention_probs_dropout_prob": 0.05,
+  "local_attn_chunk_length": 64,
+  "local_num_chunks_after": 0,
+  "local_num_chunks_before": 1,
+  "lsh_attention_probs_dropout_prob": 0.0,
+  "lsh_attn_chunk_length": 64,
+  "lsh_num_chunks_after": 0,
+  "lsh_num_chunks_before": 1,
+  "max_position_embeddings": 16384,
+  "model_type": "reformer",
+  "num_attention_heads": 12,
+  "num_buckets": [
+    64,
+    128
+  ],
+  "num_chunks_after": 0,
+  "num_chunks_before": 1,
+  "num_hashes": 1,
+  "num_hidden_layers": 12,
+  "output_attentions": true,
+  "output_hidden_states": true,
+  "output_past": true,
+  "pad_token_id": 0,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 100
+    }
+  },
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.20.1",
+  "use_cache": true,
+  "vocab_size": 52000
+}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b8fe5305f1dcb1c82f958cd2ab3533f15f4ec1d886de349a05ffbeeae54240e
+size 711743775

runs/Jul27_12-02-38_aaf4165f6dc0/1658923509.9307225/events.out.tfevents.1658923509.aaf4165f6dc0.91.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5a7485480595a3b11773c63fca69a1240bb8c04e794ea9d790fef50d3437c6c
+size 5393

runs/Jul27_12-02-38_aaf4165f6dc0/events.out.tfevents.1658923509.aaf4165f6dc0.91.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23e1bedefe59b7bfa887bf1b7b845ba7e159c074474412bfa2766bea0067b07c
+size 6346

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42393bcfe3a12a59639e323942cae59204e13513f177b435bd75c414927d9c89
+size 3375