Upload 4 files
Browse files- README.md +67 -0
- added_tokens.json +3 -0
- config.json +43 -0
- gitattributes.txt +34 -0
README.md
ADDED
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: mit
|
3 |
+
tags:
|
4 |
+
- generated_from_trainer
|
5 |
+
metrics:
|
6 |
+
- accuracy
|
7 |
+
base_model: microsoft/deberta-v3-base
|
8 |
+
model-index:
|
9 |
+
- name: deberta-v3-base-injection
|
10 |
+
results: []
|
11 |
+
datasets:
|
12 |
+
- deepset/prompt-injections
|
13 |
+
language:
|
14 |
+
- en
|
15 |
+
- de
|
16 |
+
---
|
17 |
+
|
18 |
+
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
19 |
+
should probably proofread and complete it, then remove this comment. -->
|
20 |
+
|
21 |
+
# deberta-v3-base-injection
|
22 |
+
|
23 |
+
This model is a fine-tuned version of [microsoft/deberta-v3-base](https://huggingface.co/microsoft/deberta-v3-base) on the [promp-injection](https://huggingface.co/datasets/JasperLS/prompt-injections) dataset.
|
24 |
+
It achieves the following results on the evaluation set:
|
25 |
+
- Loss: 0.0673
|
26 |
+
- Accuracy: 0.9914
|
27 |
+
|
28 |
+
## Model description
|
29 |
+
|
30 |
+
This model detects prompt injection attempts and classifies them as "INJECTION". Legitimate requests are classified as "LEGIT". The dataset assumes that legitimate requests are either all sorts of questions of key word searches.
|
31 |
+
|
32 |
+
## Intended uses & limitations
|
33 |
+
|
34 |
+
If you are using this model to secure your system and it is overly "trigger-happy" to classify requests as injections, consider collecting legitimate examples and retraining the model with the [promp-injection](https://huggingface.co/datasets/JasperLS/prompt-injections) dataset.
|
35 |
+
|
36 |
+
## Training and evaluation data
|
37 |
+
|
38 |
+
Based in the [promp-injection](https://huggingface.co/datasets/JasperLS/prompt-injections) dataset.
|
39 |
+
|
40 |
+
## Training procedure
|
41 |
+
|
42 |
+
### Training hyperparameters
|
43 |
+
|
44 |
+
The following hyperparameters were used during training:
|
45 |
+
- learning_rate: 2e-05
|
46 |
+
- train_batch_size: 8
|
47 |
+
- eval_batch_size: 8
|
48 |
+
- seed: 42
|
49 |
+
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
50 |
+
- lr_scheduler_type: linear
|
51 |
+
- num_epochs: 3
|
52 |
+
|
53 |
+
### Training results
|
54 |
+
|
55 |
+
| Training Loss | Epoch | Step | Validation Loss | Accuracy |
|
56 |
+
|:-------------:|:-----:|:----:|:---------------:|:--------:|
|
57 |
+
| No log | 1.0 | 69 | 0.2353 | 0.9741 |
|
58 |
+
| No log | 2.0 | 138 | 0.0894 | 0.9741 |
|
59 |
+
| No log | 3.0 | 207 | 0.0673 | 0.9914 |
|
60 |
+
|
61 |
+
|
62 |
+
### Framework versions
|
63 |
+
|
64 |
+
- Transformers 4.29.1
|
65 |
+
- Pytorch 2.0.0+cu118
|
66 |
+
- Datasets 2.12.0
|
67 |
+
- Tokenizers 0.13.3
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[MASK]": 128000
|
3 |
+
}
|
config.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "microsoft/deberta-v3-base",
|
3 |
+
"architectures": [
|
4 |
+
"DebertaV2ForSequenceClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"hidden_act": "gelu",
|
8 |
+
"hidden_dropout_prob": 0.1,
|
9 |
+
"hidden_size": 768,
|
10 |
+
"id2label": {
|
11 |
+
"0": "LEGIT",
|
12 |
+
"1": "INJECTION"
|
13 |
+
},
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 3072,
|
16 |
+
"label2id": {
|
17 |
+
"INJECTION": 1,
|
18 |
+
"LEGIT": 0
|
19 |
+
},
|
20 |
+
"layer_norm_eps": 1e-07,
|
21 |
+
"max_position_embeddings": 512,
|
22 |
+
"max_relative_positions": -1,
|
23 |
+
"model_type": "deberta-v2",
|
24 |
+
"norm_rel_ebd": "layer_norm",
|
25 |
+
"num_attention_heads": 12,
|
26 |
+
"num_hidden_layers": 12,
|
27 |
+
"pad_token_id": 0,
|
28 |
+
"pooler_dropout": 0,
|
29 |
+
"pooler_hidden_act": "gelu",
|
30 |
+
"pooler_hidden_size": 768,
|
31 |
+
"pos_att_type": [
|
32 |
+
"p2c",
|
33 |
+
"c2p"
|
34 |
+
],
|
35 |
+
"position_biased_input": false,
|
36 |
+
"position_buckets": 256,
|
37 |
+
"relative_attention": true,
|
38 |
+
"share_att_key": true,
|
39 |
+
"torch_dtype": "float32",
|
40 |
+
"transformers_version": "4.29.1",
|
41 |
+
"type_vocab_size": 0,
|
42 |
+
"vocab_size": 128100
|
43 |
+
}
|
gitattributes.txt
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
29 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
30 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
31 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
32 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
33 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
34 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|