init
Browse files- README.md +160 -0
- config.json +57 -0
- preprocessor_config.json +24 -0
- pytorch_model.bin +3 -0
- training_args.bin +3 -0
README.md
ADDED
@@ -0,0 +1,160 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
base_model: facebook/detr-resnet-50
|
4 |
+
tags:
|
5 |
+
- generated_from_trainer
|
6 |
+
model-index:
|
7 |
+
- name: detr-V8
|
8 |
+
results: []
|
9 |
+
---
|
10 |
+
|
11 |
+
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
12 |
+
should probably proofread and complete it, then remove this comment. -->
|
13 |
+
|
14 |
+
# detr-V8
|
15 |
+
|
16 |
+
This model is a fine-tuned version of [facebook/detr-resnet-50](https://huggingface.co/facebook/detr-resnet-50) on an unspecified dataset (no dataset name was recorded by the Trainer).
|
17 |
+
It achieves the following results on the evaluation set:
|
18 |
+
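- Loss: 0.2139 (validation loss at the final logged step, 104000; the lowest logged validation loss is 0.2109 at step 103000)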
|
19 |
+
|
20 |
+
## Model description
|
21 |
+
|
22 |
+
More information needed
|
23 |
+
|
24 |
+
## Intended uses & limitations
|
25 |
+
|
26 |
+
More information needed
|
27 |
+
|
28 |
+
## Training and evaluation data
|
29 |
+
|
30 |
+
More information needed
|
31 |
+
|
32 |
+
## Training procedure
|
33 |
+
|
34 |
+
### Training hyperparameters
|
35 |
+
|
36 |
+
The following hyperparameters were used during training:
|
37 |
+
- learning_rate: 2e-05
|
38 |
+
- train_batch_size: 8
|
39 |
+
- eval_batch_size: 8
|
40 |
+
- seed: 42
|
41 |
+
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
42 |
+
- lr_scheduler_type: linear
|
43 |
+
- num_epochs: 50
|
44 |
+
|
45 |
+
### Training results
|
46 |
+
|
47 |
+
| Training Loss | Epoch | Step | Validation Loss |
|
48 |
+
|:-------------:|:-----:|:------:|:---------------:|
|
49 |
+
| No log | 0.48 | 1000 | 0.3770 |
|
50 |
+
| No log | 0.96 | 2000 | 0.3967 |
|
51 |
+
| 0.4391 | 1.43 | 3000 | 0.3822 |
|
52 |
+
| 0.4391 | 1.91 | 4000 | 0.4163 |
|
53 |
+
| 0.4434 | 2.39 | 5000 | 0.3888 |
|
54 |
+
| 0.4434 | 2.87 | 6000 | 0.3867 |
|
55 |
+
| 0.4509 | 3.35 | 7000 | 0.4205 |
|
56 |
+
| 0.4509 | 3.83 | 8000 | 0.4014 |
|
57 |
+
| 0.455 | 4.3 | 9000 | 0.4117 |
|
58 |
+
| 0.455 | 4.78 | 10000 | 0.3964 |
|
59 |
+
| 0.4476 | 5.26 | 11000 | 0.3915 |
|
60 |
+
| 0.4476 | 5.74 | 12000 | 0.3919 |
|
61 |
+
| 0.444 | 6.22 | 13000 | 0.4026 |
|
62 |
+
| 0.444 | 6.7 | 14000 | 0.3832 |
|
63 |
+
| 0.443 | 7.17 | 15000 | 0.4057 |
|
64 |
+
| 0.443 | 7.65 | 16000 | 0.3677 |
|
65 |
+
| 0.4232 | 8.13 | 17000 | 0.3746 |
|
66 |
+
| 0.4232 | 8.61 | 18000 | 0.3672 |
|
67 |
+
| 0.4202 | 9.09 | 19000 | 0.3629 |
|
68 |
+
| 0.4202 | 9.56 | 20000 | 0.3739 |
|
69 |
+
| 0.4131 | 10.04 | 21000 | 0.3712 |
|
70 |
+
| 0.4131 | 10.52 | 22000 | 0.3470 |
|
71 |
+
| 0.4131 | 11.0 | 23000 | 0.3632 |
|
72 |
+
| 0.4024 | 11.48 | 24000 | 0.3561 |
|
73 |
+
| 0.4024 | 11.96 | 25000 | 0.3562 |
|
74 |
+
| 0.4013 | 12.43 | 26000 | 0.3253 |
|
75 |
+
| 0.4013 | 12.91 | 27000 | 0.3390 |
|
76 |
+
| 0.3925 | 13.39 | 28000 | 0.3398 |
|
77 |
+
| 0.3925 | 13.87 | 29000 | 0.3460 |
|
78 |
+
| 0.3804 | 14.35 | 30000 | 0.3338 |
|
79 |
+
| 0.3804 | 14.83 | 31000 | 0.3201 |
|
80 |
+
| 0.3757 | 15.3 | 32000 | 0.3119 |
|
81 |
+
| 0.3757 | 15.78 | 33000 | 0.3106 |
|
82 |
+
| 0.3663 | 16.26 | 34000 | 0.3164 |
|
83 |
+
| 0.3663 | 16.74 | 35000 | 0.3190 |
|
84 |
+
| 0.3588 | 17.22 | 36000 | 0.3141 |
|
85 |
+
| 0.3588 | 17.69 | 37000 | 0.3262 |
|
86 |
+
| 0.3515 | 18.17 | 38000 | 0.3027 |
|
87 |
+
| 0.3515 | 18.65 | 39000 | 0.3178 |
|
88 |
+
| 0.3557 | 19.13 | 40000 | 0.3053 |
|
89 |
+
| 0.3557 | 19.61 | 41000 | 0.3032 |
|
90 |
+
| 0.3478 | 20.09 | 42000 | 0.3147 |
|
91 |
+
| 0.3478 | 20.56 | 43000 | 0.3069 |
|
92 |
+
| 0.3451 | 21.04 | 44000 | 0.3070 |
|
93 |
+
| 0.3451 | 21.52 | 45000 | 0.3055 |
|
94 |
+
| 0.3451 | 22.0 | 46000 | 0.2883 |
|
95 |
+
| 0.3367 | 22.48 | 47000 | 0.3090 |
|
96 |
+
| 0.3367 | 22.96 | 48000 | 0.2906 |
|
97 |
+
| 0.3348 | 23.43 | 49000 | 0.2805 |
|
98 |
+
| 0.3348 | 23.91 | 50000 | 0.2920 |
|
99 |
+
| 0.3298 | 24.39 | 51000 | 0.2854 |
|
100 |
+
| 0.3298 | 24.87 | 52000 | 0.2841 |
|
101 |
+
| 0.3254 | 25.35 | 53000 | 0.2822 |
|
102 |
+
| 0.3254 | 25.82 | 54000 | 0.2716 |
|
103 |
+
| 0.3169 | 26.3 | 55000 | 0.2825 |
|
104 |
+
| 0.3169 | 26.78 | 56000 | 0.2700 |
|
105 |
+
| 0.314 | 27.26 | 57000 | 0.2640 |
|
106 |
+
| 0.314 | 27.74 | 58000 | 0.2728 |
|
107 |
+
| 0.3047 | 28.22 | 59000 | 0.2654 |
|
108 |
+
| 0.3047 | 28.69 | 60000 | 0.2691 |
|
109 |
+
| 0.2999 | 29.17 | 61000 | 0.2601 |
|
110 |
+
| 0.2999 | 29.65 | 62000 | 0.2607 |
|
111 |
+
| 0.297 | 30.13 | 63000 | 0.2581 |
|
112 |
+
| 0.297 | 30.61 | 64000 | 0.2511 |
|
113 |
+
| 0.2946 | 31.09 | 65000 | 0.2557 |
|
114 |
+
| 0.2946 | 31.56 | 66000 | 0.2568 |
|
115 |
+
| 0.2912 | 32.04 | 67000 | 0.2569 |
|
116 |
+
| 0.2912 | 32.52 | 68000 | 0.2594 |
|
117 |
+
| 0.2912 | 33.0 | 69000 | 0.2553 |
|
118 |
+
| 0.2906 | 33.48 | 70000 | 0.2425 |
|
119 |
+
| 0.2906 | 33.96 | 71000 | 0.2475 |
|
120 |
+
| 0.2833 | 34.43 | 72000 | 0.2394 |
|
121 |
+
| 0.2833 | 34.91 | 73000 | 0.2422 |
|
122 |
+
| 0.278 | 35.39 | 74000 | 0.2403 |
|
123 |
+
| 0.278 | 35.87 | 75000 | 0.2349 |
|
124 |
+
| 0.2738 | 36.35 | 76000 | 0.2300 |
|
125 |
+
| 0.2738 | 36.82 | 77000 | 0.2332 |
|
126 |
+
| 0.2701 | 37.3 | 78000 | 0.2309 |
|
127 |
+
| 0.2701 | 37.78 | 79000 | 0.2298 |
|
128 |
+
| 0.2659 | 38.26 | 80000 | 0.2343 |
|
129 |
+
| 0.2659 | 38.74 | 81000 | 0.2265 |
|
130 |
+
| 0.2626 | 39.22 | 82000 | 0.2310 |
|
131 |
+
| 0.2626 | 39.69 | 83000 | 0.2255 |
|
132 |
+
| 0.259 | 40.17 | 84000 | 0.2263 |
|
133 |
+
| 0.259 | 40.65 | 85000 | 0.2282 |
|
134 |
+
| 0.2563 | 41.13 | 86000 | 0.2309 |
|
135 |
+
| 0.2563 | 41.61 | 87000 | 0.2270 |
|
136 |
+
| 0.2548 | 42.09 | 88000 | 0.2237 |
|
137 |
+
| 0.2548 | 42.56 | 89000 | 0.2203 |
|
138 |
+
| 0.254 | 43.04 | 90000 | 0.2204 |
|
139 |
+
| 0.254 | 43.52 | 91000 | 0.2218 |
|
140 |
+
| 0.254 | 44.0 | 92000 | 0.2207 |
|
141 |
+
| 0.2484 | 44.48 | 93000 | 0.2144 |
|
142 |
+
| 0.2484 | 44.95 | 94000 | 0.2194 |
|
143 |
+
| 0.2475 | 45.43 | 95000 | 0.2165 |
|
144 |
+
| 0.2475 | 45.91 | 96000 | 0.2162 |
|
145 |
+
| 0.2453 | 46.39 | 97000 | 0.2136 |
|
146 |
+
| 0.2453 | 46.87 | 98000 | 0.2152 |
|
147 |
+
| 0.2441 | 47.35 | 99000 | 0.2162 |
|
148 |
+
| 0.2441 | 47.82 | 100000 | 0.2171 |
|
149 |
+
| 0.2408 | 48.3 | 101000 | 0.2119 |
|
150 |
+
| 0.2408 | 48.78 | 102000 | 0.2131 |
|
151 |
+
| 0.2389 | 49.26 | 103000 | 0.2109 |
|
152 |
+
| 0.2389 | 49.74 | 104000 | 0.2139 |
|
153 |
+
|
154 |
+
|
155 |
+
### Framework versions
|
156 |
+
|
157 |
+
- Transformers 4.31.0
|
158 |
+
- PyTorch 2.0.1+cu118
|
159 |
+
- Datasets 2.13.1
|
160 |
+
- Tokenizers 0.13.3
|
config.json
ADDED
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_commit_hash": "480370a8aeeed9fc8d78837b4e94e5f936fe73f2",
|
3 |
+
"_name_or_path": "facebook/detr-resnet-50",
|
4 |
+
"activation_dropout": 0.0,
|
5 |
+
"activation_function": "relu",
|
6 |
+
"architectures": [
|
7 |
+
"DetrForObjectDetection"
|
8 |
+
],
|
9 |
+
"attention_dropout": 0.0,
|
10 |
+
"auxiliary_loss": false,
|
11 |
+
"backbone": "resnet50",
|
12 |
+
"backbone_config": null,
|
13 |
+
"bbox_cost": 5,
|
14 |
+
"bbox_loss_coefficient": 5,
|
15 |
+
"class_cost": 1,
|
16 |
+
"classifier_dropout": 0.0,
|
17 |
+
"d_model": 256,
|
18 |
+
"decoder_attention_heads": 8,
|
19 |
+
"decoder_ffn_dim": 2048,
|
20 |
+
"decoder_layerdrop": 0.0,
|
21 |
+
"decoder_layers": 6,
|
22 |
+
"dice_loss_coefficient": 1,
|
23 |
+
"dilation": false,
|
24 |
+
"dropout": 0.1,
|
25 |
+
"encoder_attention_heads": 8,
|
26 |
+
"encoder_ffn_dim": 2048,
|
27 |
+
"encoder_layerdrop": 0.0,
|
28 |
+
"encoder_layers": 6,
|
29 |
+
"eos_coefficient": 0.1,
|
30 |
+
"giou_cost": 2,
|
31 |
+
"giou_loss_coefficient": 2,
|
32 |
+
"id2label": {
|
33 |
+
"0": "block",
|
34 |
+
"1": "footer",
|
35 |
+
"2": "header"
|
36 |
+
},
|
37 |
+
"init_std": 0.02,
|
38 |
+
"init_xavier_std": 1.0,
|
39 |
+
"is_encoder_decoder": true,
|
40 |
+
"label2id": {
|
41 |
+
"block": 0,
|
42 |
+
"footer": 1,
|
43 |
+
"header": 2
|
44 |
+
},
|
45 |
+
"mask_loss_coefficient": 1,
|
46 |
+
"max_position_embeddings": 1024,
|
47 |
+
"model_type": "detr",
|
48 |
+
"num_channels": 3,
|
49 |
+
"num_hidden_layers": 6,
|
50 |
+
"num_queries": 100,
|
51 |
+
"position_embedding_type": "sine",
|
52 |
+
"scale_embedding": false,
|
53 |
+
"torch_dtype": "float32",
|
54 |
+
"transformers_version": "4.7.0.dev0",
|
55 |
+
"use_pretrained_backbone": true,
|
56 |
+
"use_timm_backbone": true
|
57 |
+
}
|
preprocessor_config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"do_normalize": true,
|
3 |
+
"do_pad": true,
|
4 |
+
"do_rescale": true,
|
5 |
+
"do_resize": true,
|
6 |
+
"format": "coco_detection",
|
7 |
+
"image_mean": [
|
8 |
+
0.485,
|
9 |
+
0.456,
|
10 |
+
0.406
|
11 |
+
],
|
12 |
+
"image_processor_type": "DetrImageProcessor",
|
13 |
+
"image_std": [
|
14 |
+
0.229,
|
15 |
+
0.224,
|
16 |
+
0.225
|
17 |
+
],
|
18 |
+
"resample": 2,
|
19 |
+
"rescale_factor": 0.00392156862745098,
|
20 |
+
"size": {
|
21 |
+
"longest_edge": 1333,
|
22 |
+
"shortest_edge": 800
|
23 |
+
}
|
24 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5093a383922dfe65099f81340fb00e2e62b379dfb5f634d590a7c99e772b47c
|
3 |
+
size 166618149
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dedb2e805a33f9a5b1a599841973942c8cc62fca7adea1ff574e6ef977a26d6
|
3 |
+
size 3963
|