nadika committed on
Commit
4108fba
1 Parent(s): 8eebc32

End of training

Browse files
Files changed (3) hide show
  1. README.md +2 -2
  2. config.json +31 -30
  3. model.safetensors +2 -2
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
 
2
  tags:
3
  - generated_from_trainer
4
- base_model: Rajan/NepaliBERT
5
  model-index:
6
  - name: nepali_gov_complaints_classification
7
  results: []
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  This model is a fine-tuned version of [Rajan/NepaliBERT](https://huggingface.co/Rajan/NepaliBERT) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
- - Loss: 0.2503
18
 
19
  ## Model description
20
 
 
1
  ---
2
+ base_model: Rajan/NepaliBERT
3
  tags:
4
  - generated_from_trainer
 
5
  model-index:
6
  - name: nepali_gov_complaints_classification
7
  results: []
 
14
 
15
  This model is a fine-tuned version of [Rajan/NepaliBERT](https://huggingface.co/Rajan/NepaliBERT) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
+ - Loss: 0.2385
18
 
19
  ## Model description
20
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./my_nepalibert_model",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -10,38 +10,38 @@
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
- "0": "\u0905\u0930\u094d\u0925 \u0938\u092c\u0928\u094d\u0927\u0940",
14
- "1": "\u0905\u0930\u094d\u0925\u093f\u0915 \u0905\u0928\u093f\u092f\u092e\u093f\u0924\u0924\u093e \u0924\u0925\u093e \u092d\u094d\u0930\u0937\u094d\u091f\u093e\u091a\u093e\u0930 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
15
- "2": "\u0915\u0930\u094d\u092e\u091a\u093e\u0930\u0940 \u0938\u092e\u094d\u0935\u0928\u094d\u0927\u0940",
16
- "3": "\u0916\u093e\u0928\u0947\u092a\u093e\u0928\u0940",
17
- "4": "\u0928\u093f\u0930\u094d\u092e\u093e\u0923 \u0915\u093e\u0930\u094d\u092f \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
18
- "5": "\u092a\u093e\u0930\u094d\u0915\u093f\u0919\u094d\u0917 \u0924\u0925\u093e \u092e\u0947\u091f\u094d\u0930\u094b \u092a\u0941\u0932\u093f\u0938",
19
- "6": "\u092a\u094d\u0930\u093e\u0915\u0943\u0924\u093f\u0915 \u0936\u094d\u0930\u094b\u0924/\u0938\u093e\u0927\u0928 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
20
- "7": "\u092b\u094b\u0939\u094b\u0930\u092e\u0948\u0932\u093e \u0935\u094d\u092f\u0935\u0938\u094d\u0925\u093e\u092a\u0928",
21
- "8": "\u0932\u093e\u0917\u0941 \u092a\u0926\u093e\u0930\u094d\u0925 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
22
- "9": "\u0935\u0947\u092c\u0938\u093e\u0907\u091f \u0924\u0925\u093e \u0905\u092d\u093f\u0932\u0947\u0916 \u0935\u094d\u092f\u0935\u0938\u094d\u0925\u093e\u092a\u0928 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
23
- "10": "\u0936\u093e\u0928\u094d\u0924\u093f \u0938\u0941\u0930\u0915\u094d\u0937\u093e",
24
- "11": "\u0938\u0942\u091a\u0928\u093e \u0924\u0925\u093e \u0938\u0902\u091a\u093e\u0930",
25
- "12": "\u0938\u094b\u0927\u092a\u0941\u091b, \u0938\u0941\u091d\u093e\u0935, \u092a\u094d\u0930\u0936\u0902\u0938\u093e \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940",
26
- "13": "\u0938\u094d\u0935\u093e\u0938\u094d\u0925\u094d\u092f\u0938\u0901\u0917 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940"
27
  },
28
  "initializer_range": 0.02,
29
  "intermediate_size": 3072,
30
  "label2id": {
31
- "\u0905\u0930\u094d\u0925 \u0938\u092c\u0928\u094d\u0927\u0940": 0,
32
- "\u0905\u0930\u094d\u0925\u093f\u0915 \u0905\u0928\u093f\u092f\u092e\u093f\u0924\u0924\u093e \u0924\u0925\u093e \u092d\u094d\u0930\u0937\u094d\u091f\u093e\u091a\u093e\u0930 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 1,
33
- "\u0915\u0930\u094d\u092e\u091a\u093e\u0930\u0940 \u0938\u092e\u094d\u0935\u0928\u094d\u0927\u0940": 2,
34
- "\u0916\u093e\u0928\u0947\u092a\u093e\u0928\u0940": 3,
35
- "\u0928\u093f\u0930\u094d\u092e\u093e\u0923 \u0915\u093e\u0930\u094d\u092f \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 4,
36
- "\u092a\u093e\u0930\u094d\u0915\u093f\u0919\u094d\u0917 \u0924\u0925\u093e \u092e\u0947\u091f\u094d\u0930\u094b \u092a\u0941\u0932\u093f\u0938": 5,
37
- "\u092a\u094d\u0930\u093e\u0915\u0943\u0924\u093f\u0915 \u0936\u094d\u0930\u094b\u0924/\u0938\u093e\u0927\u0928 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 6,
38
- "\u092b\u094b\u0939\u094b\u0930\u092e\u0948\u0932\u093e \u0935\u094d\u092f\u0935\u0938\u094d\u0925\u093e\u092a\u0928": 7,
39
- "\u0932\u093e\u0917\u0941 \u092a\u0926\u093e\u0930\u094d\u0925 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 8,
40
- "\u0935\u0947\u092c\u0938\u093e\u0907\u091f \u0924\u0925\u093e \u0905\u092d\u093f\u0932\u0947\u0916 \u0935\u094d\u092f\u0935\u0938\u094d\u0925\u093e\u092a\u0928 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 9,
41
- "\u0936\u093e\u0928\u094d\u0924\u093f \u0938\u0941\u0930\u0915\u094d\u0937\u093e": 10,
42
- "\u0938\u0942\u091a\u0928\u093e \u0924\u0925\u093e \u0938\u0902\u091a\u093e\u0930": 11,
43
- "\u0938\u094b\u0927\u092a\u0941\u091b, \u0938\u0941\u091d\u093e\u0935, \u092a\u094d\u0930\u0936\u0902\u0938\u093e \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 12,
44
- "\u0938\u094d\u0935\u093e\u0938\u094d\u0925\u094d\u092f\u0938\u0901\u0917 \u0938\u092e\u094d\u092c\u0928\u094d\u0927\u0940": 13
45
  },
46
  "layer_norm_eps": 1e-12,
47
  "max_position_embeddings": 512,
@@ -50,9 +50,10 @@
50
  "num_hidden_layers": 6,
51
  "pad_token_id": 0,
52
  "position_embedding_type": "absolute",
 
53
  "torch_dtype": "float32",
54
  "transformers_version": "4.38.2",
55
  "type_vocab_size": 2,
56
  "use_cache": true,
57
  "vocab_size": 50000
58
- }
 
1
  {
2
+ "_name_or_path": "Rajan/NepaliBERT",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
 
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
  "id2label": {
13
+ "0": "LABEL_0",
14
+ "1": "LABEL_1",
15
+ "2": "LABEL_2",
16
+ "3": "LABEL_3",
17
+ "4": "LABEL_4",
18
+ "5": "LABEL_5",
19
+ "6": "LABEL_6",
20
+ "7": "LABEL_7",
21
+ "8": "LABEL_8",
22
+ "9": "LABEL_9",
23
+ "10": "LABEL_10",
24
+ "11": "LABEL_11",
25
+ "12": "LABEL_12",
26
+ "13": "LABEL_13"
27
  },
28
  "initializer_range": 0.02,
29
  "intermediate_size": 3072,
30
  "label2id": {
31
+ "LABEL_0": 0,
32
+ "LABEL_1": 1,
33
+ "LABEL_10": 10,
34
+ "LABEL_11": 11,
35
+ "LABEL_12": 12,
36
+ "LABEL_13": 13,
37
+ "LABEL_2": 2,
38
+ "LABEL_3": 3,
39
+ "LABEL_4": 4,
40
+ "LABEL_5": 5,
41
+ "LABEL_6": 6,
42
+ "LABEL_7": 7,
43
+ "LABEL_8": 8,
44
+ "LABEL_9": 9
45
  },
46
  "layer_norm_eps": 1e-12,
47
  "max_position_embeddings": 512,
 
50
  "num_hidden_layers": 6,
51
  "pad_token_id": 0,
52
  "position_embedding_type": "absolute",
53
+ "problem_type": "single_label_classification",
54
  "torch_dtype": "float32",
55
  "transformers_version": "4.38.2",
56
  "type_vocab_size": 2,
57
  "use_cache": true,
58
  "vocab_size": 50000
59
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10ac3503a5c69ce108e2a521fd7f8855a14399c6af01e2bc014467753ded2cfb
3
- size 327674816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ca3e3d07b8358bbaba3478503163aa83bc462ddebf440ca1d746dbcce14925
3
+ size 327711728