johnhandleyd committed on
Commit 575c2f3
1 Parent(s): a56d003

Upload folder using huggingface_hub

README.md CHANGED
@@ -2,35 +2,30 @@
  license: mit
  base_model: TheBloke/zephyr-7B-alpha-GPTQ
  tags:
- - trl
- - sft
  - generated_from_trainer
- - peft
- - gptq
  model-index:
- - name: thesa
+ - name: thesa_v1
  results: []
- language:
- - en
- datasets:
- - loaiabdalslam/counselchat
- pipeline_tag: text-generation
- widget:
- - text: "<|system|>You are a therapist helping patients.<|user|>I'm fighting with my boyfriend and he's not talking to me. I don't know what to do<|assistant|>"
-   example_title: "Example 1"
  ---

- # Thesa
-
- Thesa is an experimental project of a therapy chatbot trained on mental health data and fine-tuned with the Zephyr GPTQ model that uses quantization to decrease high computatinal and storage costs.
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
+ should probably proofread and complete it, then remove this comment. -->
+
+ # thesa_v1
+
+ This model is a fine-tuned version of [TheBloke/zephyr-7B-alpha-GPTQ](https://huggingface.co/TheBloke/zephyr-7B-alpha-GPTQ) on an unknown dataset.

  ## Model description

- - Fine-tuned from [TheBloke/zephyr-7B-alpha-GPTQ](https://huggingface.co/TheBloke/zephyr-7B-alpha-GPTQ)
+ More information needed

  ## Intended uses & limitations

- The intended use is experimental.
+ More information needed
+
+ ## Training and evaluation data
+
+ More information needed

  ## Training procedure

@@ -43,16 +38,13 @@ The following hyperparameters were used during training:
  - seed: 42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: cosine
- - training_steps: 250
+ - lr_scheduler_warmup_ratio: 0.1
+ - num_epochs: 10
  - mixed_precision_training: Native AMP

-
  ### Framework versions

  - Transformers 4.35.2
  - Pytorch 2.1.0+cu121
  - Datasets 2.16.1
  - Tokenizers 0.15.1
-
- ## More info
- More info at https://github.com/johnhandleyd/thesa
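The widget text removed from the README above encodes Zephyr's chat markers inline. A minimal sketch of assembling such a prompt string, assuming the `<|system|>` / `<|user|>` / `<|assistant|>` markers shown in the deleted widget (the real tokenizer's `apply_chat_template()` also inserts newlines and EOS tokens between turns, which this sketch omits):

```python
def build_zephyr_prompt(system: str, user: str) -> str:
    """Assemble a Zephyr-alpha style prompt string (hypothetical helper
    mirroring the inline widget format from the old model card)."""
    return f"<|system|>{system}<|user|>{user}<|assistant|>"

prompt = build_zephyr_prompt(
    "You are a therapist helping patients.",
    "I'm fighting with my boyfriend and he's not talking to me. I don't know what to do",
)
```

The trailing `<|assistant|>` marker cues the model to generate the assistant turn.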
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:53b56432ae401224e5ff9ca98ac000d12536a457865b1e1445e58d48278ba023
- size 27280152
+ oid sha256:870a387ece9708a79136efdea27fc4c3c8727e7941ac6356bd8c10040c274f00
+ size 133
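These binary-file diffs show Git LFS pointer files rather than the binaries themselves: each pointer records a spec version, the object's SHA-256 `oid`, and its byte `size`. A sketch of parsing that three-field format (hypothetical helper; the pointer text is copied from the new side of this diff):

```python
def parse_lfs_pointer(text: str) -> dict:
    """Parse a Git LFS pointer file into its key/value fields.
    Each line is 'key value' separated by a single space."""
    fields = {}
    for line in text.strip().splitlines():
        key, _, value = line.partition(" ")
        fields[key] = value
    return fields

pointer = """version https://git-lfs.github.com/spec/v1
oid sha256:870a387ece9708a79136efdea27fc4c3c8727e7941ac6356bd8c10040c274f00
size 133
"""
info = parse_lfs_pointer(pointer)
```

Note the recorded `size` dropped from 27280152 bytes to 133 bytes, i.e. the newly uploaded object is itself only 133 bytes; that is pointer-sized, which may indicate the adapter weights were not fully uploaded in this commit.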
runs/Feb26_23-15-54_7d7bf0a59e1f/events.out.tfevents.1708989426.7d7bf0a59e1f.1627.0 ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:eb8e7b8d1fb0d7d44d65874cb4ce7718031a4b244603811b6ae4550772c1c410
+ size 130
special_tokens_map.json CHANGED
@@ -18,13 +18,7 @@
    "rstrip": false,
    "single_word": false
  },
- "pad_token": {
-   "content": "</s>",
-   "lstrip": false,
-   "normalized": false,
-   "rstrip": false,
-   "single_word": false
- },
+ "pad_token": "</s>",
  "unk_token": {
    "content": "<unk>",
    "lstrip": false,
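The change above collapses the `pad_token` entry from a full added-token dict to a bare string; both shapes are accepted in `special_tokens_map.json` and name the same token. A sketch (hypothetical helper) showing that either form yields the same pad token content:

```python
import json

def pad_token_content(special_tokens_map: dict) -> str:
    """Return the pad token string whether it is stored as a bare
    string or as a full added-token dict (hypothetical helper)."""
    pad = special_tokens_map.get("pad_token")
    if isinstance(pad, dict):
        return pad["content"]
    return pad

old = json.loads(
    '{"pad_token": {"content": "</s>", "lstrip": false, "normalized": false, '
    '"rstrip": false, "single_word": false}}'
)
new = json.loads('{"pad_token": "</s>"}')
```

The dict form additionally carries normalization flags; the bare-string form falls back to the tokenizer's defaults for those.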
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
    "version": "1.0",
    "truncation": {
      "direction": "Left",
-     "max_length": 1024,
+     "max_length": 512,
      "strategy": "LongestFirst",
      "stride": 0
    },
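This hunk halves the truncation window from 1024 to 512 tokens while keeping `"direction": "Left"`, so overlong inputs are cut from the front and the most recent tokens survive. A minimal sketch of that behavior on a flat token-id list (the real `tokenizers` library also handles pairs and the `LongestFirst` strategy, which this ignores):

```python
def truncate_left(ids: list, max_length: int = 512) -> list:
    """Mimic left-direction truncation: when the sequence exceeds
    max_length, drop tokens from the start and keep the tail."""
    return ids[-max_length:] if len(ids) > max_length else ids
```

Left truncation suits chat inputs, where the latest turns matter more than the oldest context.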
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
- size 493443
+ oid sha256:d3daefa6fd9ee26430a71ad6009f05c4c4ec086746b2dcc3d04649f631d3654f
+ size 131
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:0940395a2687650e17943742dd9d4f2da52e06e88efc1b5f2092954bad39de8c
- size 4600
+ oid sha256:cc72676d9cc9796870f3d2f933bc9ecbe7e0ed5651fb64662437296f3d056120
+ size 129
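`training_args.bin` serializes the run's `TrainingArguments`. A hypothetical reconstruction, as a plain dict, of the hyperparameters the README hunk earlier in this commit lists (key names follow the usual `transformers` argument names; this is a sketch, not the contents of the binary):

```python
# Hypothetical reconstruction of the hyperparameters listed in the
# README diff; training_args.bin stores the serialized TrainingArguments.
training_args = {
    "seed": 42,
    "adam_beta1": 0.9,            # "Adam with betas=(0.9,0.999)"
    "adam_beta2": 0.999,
    "adam_epsilon": 1e-08,        # "epsilon=1e-08"
    "lr_scheduler_type": "cosine",
    "warmup_ratio": 0.1,          # replaces the removed training_steps: 250
    "num_train_epochs": 10,
    "fp16": True,                 # "Native AMP" mixed precision
}
```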