qubvel-hf HF staff committed on
Commit
55ad7b2
1 Parent(s): b7bd3b7

Model save

Browse files
README.md ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: hustvl/yolos-small
4
+ tags:
5
+ - generated_from_trainer
6
+ model-index:
7
+ - name: hustvl-yolos-small-finetuned-10k-cppe5
8
+ results: []
9
+ ---
10
+
11
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
12
+ should probably proofread and complete it, then remove this comment. -->
13
+
14
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/qubvel-hf-co/transformers-detection-model-finetuning-cppe5/runs/u2o06hbj)
15
+ # hustvl-yolos-small-finetuned-10k-cppe5
16
+
17
+ This model is a fine-tuned version of [hustvl/yolos-small](https://huggingface.co/hustvl/yolos-small) on a dataset that the Trainer did not record (the model name and class labels indicate CPPE-5).
18
+ It achieves the following results on the evaluation set:
19
+ - Loss: 1.4674
20
+ - Map: 0.3363
21
+ - Map 50: 0.6506
22
+ - Map 75: 0.2992
23
+ - Map Small: 0.2695
24
+ - Map Medium: 0.2282
25
+ - Map Large: 0.4791
26
+ - Mar 1: 0.3441
27
+ - Mar 10: 0.4988
28
+ - Mar 100: 0.5186
29
+ - Mar Small: 0.3192
30
+ - Mar Medium: 0.3884
31
+ - Mar Large: 0.6982
32
+ - Map Coverall: 0.607
33
+ - Mar 100 Coverall: 0.7716
34
+ - Map Face Shield: 0.3854
35
+ - Mar 100 Face Shield: 0.5883
36
+ - Map Gloves: 0.2283
37
+ - Mar 100 Gloves: 0.4093
38
+ - Map Goggles: 0.1228
39
+ - Mar 100 Goggles: 0.3319
40
+ - Map Mask: 0.3379
41
+ - Mar 100 Mask: 0.4916
42
+
43
+ ## Model description
44
+
45
+ More information needed
46
+
47
+ ## Intended uses & limitations
48
+
49
+ More information needed
50
+
51
+ ## Training and evaluation data
52
+
53
+ More information needed
54
+
55
+ ## Training procedure
56
+
57
+ ### Training hyperparameters
58
+
59
+ The following hyperparameters were used during training:
60
+ - learning_rate: 5e-05
61
+ - train_batch_size: 8
62
+ - eval_batch_size: 8
63
+ - seed: 1337
64
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
65
+ - lr_scheduler_type: linear
66
+ - num_epochs: 100.0
67
+ - mixed_precision_training: Native AMP
68
+
69
+ ### Training results
70
+
71
+ | Training Loss | Epoch | Step | Validation Loss | Map | Map 50 | Map 75 | Map Small | Map Medium | Map Large | Mar 1 | Mar 10 | Mar 100 | Mar Small | Mar Medium | Mar Large | Map Coverall | Mar 100 Coverall | Map Face Shield | Mar 100 Face Shield | Map Gloves | Mar 100 Gloves | Map Goggles | Mar 100 Goggles | Map Mask | Mar 100 Mask |
72
+ |:-------------:|:-----:|:-----:|:---------------:|:------:|:------:|:------:|:---------:|:----------:|:---------:|:------:|:------:|:-------:|:---------:|:----------:|:---------:|:------------:|:----------------:|:---------------:|:-------------------:|:----------:|:--------------:|:-----------:|:---------------:|:--------:|:------------:|
73
+ | 1.9479 | 1.0 | 107 | 1.6080 | 0.15 | 0.3271 | 0.1142 | 0.0227 | 0.0603 | 0.1779 | 0.1663 | 0.3089 | 0.3414 | 0.098 | 0.2108 | 0.3973 | 0.499 | 0.7191 | 0.048 | 0.2467 | 0.0276 | 0.3377 | 0.0156 | 0.0764 | 0.1598 | 0.3268 |
74
+ | 1.4786 | 2.0 | 214 | 1.4219 | 0.1899 | 0.3864 | 0.1627 | 0.0539 | 0.0911 | 0.2756 | 0.2423 | 0.4081 | 0.4299 | 0.0864 | 0.3003 | 0.5424 | 0.5552 | 0.7951 | 0.1065 | 0.4933 | 0.0707 | 0.326 | 0.042 | 0.2028 | 0.1752 | 0.3324 |
75
+ | 1.3842 | 3.0 | 321 | 1.3797 | 0.2174 | 0.4379 | 0.1755 | 0.0584 | 0.1132 | 0.326 | 0.2616 | 0.4277 | 0.4505 | 0.2266 | 0.3179 | 0.61 | 0.5588 | 0.7698 | 0.1542 | 0.475 | 0.0952 | 0.35 | 0.0469 | 0.2764 | 0.2321 | 0.3816 |
76
+ | 1.2986 | 4.0 | 428 | 1.3926 | 0.1978 | 0.4118 | 0.1625 | 0.0355 | 0.0902 | 0.3168 | 0.2456 | 0.4139 | 0.4312 | 0.181 | 0.3023 | 0.5948 | 0.56 | 0.7568 | 0.1293 | 0.455 | 0.1054 | 0.3574 | 0.0389 | 0.2681 | 0.1553 | 0.319 |
77
+ | 1.233 | 5.0 | 535 | 1.3301 | 0.2271 | 0.5034 | 0.1694 | 0.0505 | 0.1223 | 0.3357 | 0.2595 | 0.4181 | 0.4355 | 0.205 | 0.304 | 0.5722 | 0.5531 | 0.766 | 0.2005 | 0.475 | 0.1371 | 0.3647 | 0.0537 | 0.2486 | 0.1912 | 0.3229 |
78
+ | 1.1644 | 6.0 | 642 | 1.2556 | 0.2497 | 0.5164 | 0.1981 | 0.0579 | 0.1447 | 0.3657 | 0.2915 | 0.4434 | 0.4598 | 0.1981 | 0.3224 | 0.6256 | 0.5888 | 0.7753 | 0.1927 | 0.4933 | 0.1338 | 0.373 | 0.0736 | 0.2667 | 0.2597 | 0.3905 |
79
+ | 1.1229 | 7.0 | 749 | 1.2388 | 0.234 | 0.4963 | 0.1996 | 0.1279 | 0.1367 | 0.3492 | 0.2638 | 0.4433 | 0.4576 | 0.2508 | 0.3912 | 0.6242 | 0.5616 | 0.7895 | 0.1503 | 0.4883 | 0.1564 | 0.373 | 0.043 | 0.2736 | 0.2589 | 0.3637 |
80
+ | 1.0939 | 8.0 | 856 | 1.2988 | 0.2343 | 0.5195 | 0.1773 | 0.0506 | 0.1319 | 0.3447 | 0.2687 | 0.3976 | 0.4065 | 0.1377 | 0.2645 | 0.5857 | 0.5806 | 0.7494 | 0.1693 | 0.4083 | 0.1114 | 0.3059 | 0.0683 | 0.2069 | 0.2419 | 0.362 |
81
+ | 1.0571 | 9.0 | 963 | 1.2067 | 0.2604 | 0.5346 | 0.2265 | 0.0671 | 0.1565 | 0.383 | 0.3001 | 0.4545 | 0.4655 | 0.1538 | 0.3488 | 0.625 | 0.6037 | 0.7586 | 0.2 | 0.49 | 0.1749 | 0.3858 | 0.0758 | 0.3097 | 0.2477 | 0.3832 |
82
+ | 1.0535 | 10.0 | 1070 | 1.2278 | 0.2534 | 0.5112 | 0.2324 | 0.0556 | 0.1444 | 0.3914 | 0.3011 | 0.4593 | 0.4806 | 0.1686 | 0.3462 | 0.6597 | 0.6104 | 0.7821 | 0.1993 | 0.525 | 0.1614 | 0.3956 | 0.0553 | 0.3014 | 0.2407 | 0.3989 |
83
+ | 0.9948 | 11.0 | 1177 | 1.2097 | 0.2653 | 0.5317 | 0.2346 | 0.2441 | 0.1608 | 0.3892 | 0.3125 | 0.4766 | 0.4903 | 0.2854 | 0.3756 | 0.643 | 0.5968 | 0.7648 | 0.2183 | 0.5533 | 0.1797 | 0.3936 | 0.0557 | 0.3306 | 0.276 | 0.4089 |
84
+ | 0.9766 | 12.0 | 1284 | 1.2409 | 0.258 | 0.5423 | 0.2228 | 0.1649 | 0.1503 | 0.3925 | 0.2986 | 0.4553 | 0.4667 | 0.2045 | 0.3461 | 0.6238 | 0.5955 | 0.7667 | 0.2124 | 0.5267 | 0.1877 | 0.3613 | 0.0559 | 0.3 | 0.2382 | 0.3788 |
85
+ | 0.9642 | 13.0 | 1391 | 1.2483 | 0.2733 | 0.5497 | 0.2377 | 0.1841 | 0.1614 | 0.401 | 0.3115 | 0.4527 | 0.4643 | 0.2125 | 0.3235 | 0.6653 | 0.6113 | 0.7821 | 0.2527 | 0.55 | 0.1924 | 0.3544 | 0.0694 | 0.2639 | 0.2406 | 0.3709 |
86
+ | 0.9632 | 14.0 | 1498 | 1.2315 | 0.2728 | 0.544 | 0.2363 | 0.0893 | 0.1691 | 0.3978 | 0.308 | 0.4605 | 0.4713 | 0.1705 | 0.345 | 0.6593 | 0.6124 | 0.7753 | 0.2228 | 0.4933 | 0.1615 | 0.3475 | 0.0861 | 0.325 | 0.2814 | 0.4151 |
87
+ | 0.9342 | 15.0 | 1605 | 1.2185 | 0.2843 | 0.5699 | 0.2436 | 0.2202 | 0.1798 | 0.4107 | 0.313 | 0.4628 | 0.4732 | 0.2514 | 0.3365 | 0.6666 | 0.6132 | 0.7858 | 0.2452 | 0.54 | 0.1971 | 0.3578 | 0.0855 | 0.2736 | 0.2807 | 0.4089 |
88
+ | 0.9118 | 16.0 | 1712 | 1.2268 | 0.2759 | 0.5763 | 0.2359 | 0.1335 | 0.1694 | 0.4276 | 0.3045 | 0.4556 | 0.4712 | 0.2254 | 0.3336 | 0.6805 | 0.6205 | 0.8 | 0.2553 | 0.53 | 0.161 | 0.349 | 0.0765 | 0.2833 | 0.2661 | 0.3939 |
89
+ | 0.9031 | 17.0 | 1819 | 1.2224 | 0.2794 | 0.5673 | 0.2443 | 0.2481 | 0.1638 | 0.41 | 0.3079 | 0.4683 | 0.4888 | 0.275 | 0.3562 | 0.6834 | 0.6053 | 0.8012 | 0.2647 | 0.5367 | 0.1652 | 0.3735 | 0.1022 | 0.3542 | 0.2594 | 0.3782 |
90
+ | 0.8556 | 18.0 | 1926 | 1.1809 | 0.2933 | 0.5872 | 0.265 | 0.2545 | 0.1984 | 0.3951 | 0.3132 | 0.4787 | 0.496 | 0.2908 | 0.3581 | 0.6792 | 0.5871 | 0.7981 | 0.2753 | 0.5567 | 0.1937 | 0.3971 | 0.0936 | 0.2903 | 0.3171 | 0.438 |
91
+ | 0.8221 | 19.0 | 2033 | 1.2087 | 0.2939 | 0.5973 | 0.249 | 0.0952 | 0.1777 | 0.4381 | 0.312 | 0.4685 | 0.4845 | 0.133 | 0.3389 | 0.6883 | 0.6256 | 0.8111 | 0.2686 | 0.5233 | 0.1739 | 0.3603 | 0.1 | 0.3069 | 0.3015 | 0.4207 |
92
+ | 0.8202 | 20.0 | 2140 | 1.2266 | 0.2934 | 0.5939 | 0.2522 | 0.1408 | 0.1867 | 0.4349 | 0.3234 | 0.4769 | 0.4945 | 0.1756 | 0.3613 | 0.6994 | 0.617 | 0.7975 | 0.3123 | 0.5533 | 0.1686 | 0.3637 | 0.0951 | 0.3486 | 0.2741 | 0.4095 |
93
+ | 0.7954 | 21.0 | 2247 | 1.2556 | 0.2905 | 0.6004 | 0.2432 | 0.1632 | 0.1839 | 0.438 | 0.3135 | 0.4719 | 0.4865 | 0.2116 | 0.3531 | 0.6842 | 0.6094 | 0.7741 | 0.2976 | 0.56 | 0.1763 | 0.3574 | 0.089 | 0.3069 | 0.2802 | 0.4341 |
94
+ | 0.7868 | 22.0 | 2354 | 1.2723 | 0.2717 | 0.559 | 0.2363 | 0.1494 | 0.1689 | 0.411 | 0.293 | 0.4624 | 0.4771 | 0.1901 | 0.3415 | 0.6822 | 0.5933 | 0.7735 | 0.3068 | 0.5717 | 0.1651 | 0.3358 | 0.0718 | 0.3236 | 0.2213 | 0.381 |
95
+ | 0.7827 | 23.0 | 2461 | 1.2710 | 0.2957 | 0.6092 | 0.2317 | 0.2667 | 0.1878 | 0.4432 | 0.3189 | 0.4785 | 0.4928 | 0.2995 | 0.3684 | 0.6803 | 0.6028 | 0.7802 | 0.3233 | 0.5533 | 0.1795 | 0.3843 | 0.1219 | 0.3333 | 0.2511 | 0.4128 |
96
+ | 0.7795 | 24.0 | 2568 | 1.2305 | 0.3039 | 0.6021 | 0.2739 | 0.2054 | 0.2003 | 0.4373 | 0.3229 | 0.4902 | 0.5068 | 0.2637 | 0.3887 | 0.6889 | 0.6232 | 0.766 | 0.2872 | 0.575 | 0.1954 | 0.3838 | 0.1011 | 0.3528 | 0.3125 | 0.4564 |
97
+ | 0.7524 | 25.0 | 2675 | 1.2481 | 0.2897 | 0.5968 | 0.2423 | 0.2147 | 0.1875 | 0.4391 | 0.3168 | 0.4866 | 0.5029 | 0.2532 | 0.3815 | 0.689 | 0.598 | 0.779 | 0.2973 | 0.58 | 0.1842 | 0.3833 | 0.1061 | 0.3417 | 0.2627 | 0.4307 |
98
+ | 0.7446 | 26.0 | 2782 | 1.2481 | 0.2894 | 0.5835 | 0.2479 | 0.16 | 0.182 | 0.441 | 0.3083 | 0.4857 | 0.496 | 0.1905 | 0.3783 | 0.6953 | 0.6217 | 0.7765 | 0.2919 | 0.5733 | 0.1736 | 0.3652 | 0.068 | 0.3319 | 0.292 | 0.433 |
99
+ | 0.7203 | 27.0 | 2889 | 1.2720 | 0.2871 | 0.5801 | 0.2338 | 0.2113 | 0.1852 | 0.4258 | 0.3107 | 0.48 | 0.4955 | 0.2698 | 0.3781 | 0.6844 | 0.6106 | 0.7698 | 0.2779 | 0.5633 | 0.2001 | 0.3819 | 0.0842 | 0.3333 | 0.2625 | 0.4291 |
100
+ | 0.7239 | 28.0 | 2996 | 1.2166 | 0.3043 | 0.621 | 0.256 | 0.1515 | 0.1926 | 0.4491 | 0.3286 | 0.4874 | 0.5037 | 0.2054 | 0.3733 | 0.6882 | 0.6196 | 0.7728 | 0.3166 | 0.58 | 0.1917 | 0.3799 | 0.095 | 0.3319 | 0.2985 | 0.4536 |
101
+ | 0.6987 | 29.0 | 3103 | 1.2685 | 0.3008 | 0.6003 | 0.256 | 0.2512 | 0.1964 | 0.4285 | 0.3231 | 0.4964 | 0.5118 | 0.3015 | 0.3921 | 0.6779 | 0.6247 | 0.7716 | 0.2988 | 0.5933 | 0.1999 | 0.3819 | 0.0914 | 0.3514 | 0.2895 | 0.4609 |
102
+ | 0.6776 | 30.0 | 3210 | 1.2834 | 0.2976 | 0.6053 | 0.2574 | 0.1637 | 0.1951 | 0.4457 | 0.3311 | 0.4801 | 0.4952 | 0.2704 | 0.3691 | 0.6739 | 0.6165 | 0.787 | 0.28 | 0.59 | 0.194 | 0.3652 | 0.1218 | 0.3236 | 0.2759 | 0.4101 |
103
+ | 0.6695 | 31.0 | 3317 | 1.2599 | 0.2957 | 0.5942 | 0.268 | 0.1376 | 0.1935 | 0.4377 | 0.3115 | 0.4812 | 0.4988 | 0.2589 | 0.3643 | 0.6915 | 0.6154 | 0.7852 | 0.2669 | 0.585 | 0.2035 | 0.3936 | 0.0936 | 0.2917 | 0.2991 | 0.4385 |
104
+ | 0.6829 | 32.0 | 3424 | 1.3085 | 0.2938 | 0.5904 | 0.2481 | 0.2294 | 0.1851 | 0.4296 | 0.311 | 0.4789 | 0.497 | 0.2771 | 0.3744 | 0.6878 | 0.622 | 0.7741 | 0.3067 | 0.5867 | 0.1709 | 0.3505 | 0.1139 | 0.3681 | 0.2557 | 0.4056 |
105
+ | 0.6632 | 33.0 | 3531 | 1.2422 | 0.2996 | 0.6001 | 0.2578 | 0.1768 | 0.1909 | 0.4405 | 0.3214 | 0.4901 | 0.5081 | 0.2888 | 0.3812 | 0.6588 | 0.6126 | 0.7728 | 0.2943 | 0.5967 | 0.2104 | 0.4064 | 0.0948 | 0.3208 | 0.2858 | 0.4436 |
106
+ | 0.6518 | 34.0 | 3638 | 1.2245 | 0.3093 | 0.611 | 0.2619 | 0.1701 | 0.2059 | 0.4612 | 0.3295 | 0.4808 | 0.498 | 0.2206 | 0.3699 | 0.6679 | 0.6104 | 0.7809 | 0.3062 | 0.5633 | 0.2068 | 0.3794 | 0.1203 | 0.3222 | 0.303 | 0.4441 |
107
+ | 0.6649 | 35.0 | 3745 | 1.2282 | 0.3067 | 0.621 | 0.267 | 0.2252 | 0.2014 | 0.4684 | 0.3313 | 0.4843 | 0.5019 | 0.2741 | 0.3718 | 0.6808 | 0.5992 | 0.7796 | 0.3058 | 0.5617 | 0.2148 | 0.4064 | 0.1257 | 0.3194 | 0.2883 | 0.4425 |
108
+ | 0.6373 | 36.0 | 3852 | 1.3044 | 0.3085 | 0.6184 | 0.2823 | 0.248 | 0.2014 | 0.4489 | 0.3186 | 0.4898 | 0.5107 | 0.2978 | 0.3889 | 0.6776 | 0.6084 | 0.7784 | 0.3151 | 0.59 | 0.2058 | 0.3985 | 0.113 | 0.3153 | 0.3 | 0.4715 |
109
+ | 0.6139 | 37.0 | 3959 | 1.2725 | 0.3138 | 0.6336 | 0.2796 | 0.1862 | 0.203 | 0.4697 | 0.3262 | 0.4928 | 0.5143 | 0.2357 | 0.387 | 0.6958 | 0.6116 | 0.7802 | 0.3125 | 0.5667 | 0.2204 | 0.3961 | 0.1065 | 0.3625 | 0.3181 | 0.4659 |
110
+ | 0.6087 | 38.0 | 4066 | 1.2936 | 0.3072 | 0.6272 | 0.2668 | 0.2027 | 0.2048 | 0.4465 | 0.3151 | 0.4832 | 0.5024 | 0.2461 | 0.3726 | 0.6757 | 0.6071 | 0.7981 | 0.3166 | 0.575 | 0.1965 | 0.3814 | 0.1308 | 0.3375 | 0.2848 | 0.4201 |
111
+ | 0.613 | 39.0 | 4173 | 1.2992 | 0.3233 | 0.6431 | 0.3037 | 0.1967 | 0.2164 | 0.4755 | 0.3249 | 0.4887 | 0.5027 | 0.2438 | 0.3761 | 0.6875 | 0.6188 | 0.7753 | 0.332 | 0.5717 | 0.2113 | 0.3873 | 0.1314 | 0.325 | 0.3232 | 0.4542 |
112
+ | 0.6009 | 40.0 | 4280 | 1.3210 | 0.3105 | 0.6141 | 0.2801 | 0.196 | 0.1976 | 0.446 | 0.3223 | 0.4704 | 0.4859 | 0.2349 | 0.3542 | 0.6723 | 0.6392 | 0.7722 | 0.3152 | 0.5433 | 0.1995 | 0.3672 | 0.0986 | 0.2847 | 0.3001 | 0.462 |
113
+ | 0.5766 | 41.0 | 4387 | 1.2828 | 0.3157 | 0.6377 | 0.2786 | 0.2062 | 0.2068 | 0.4597 | 0.3266 | 0.4825 | 0.5013 | 0.2481 | 0.3722 | 0.6859 | 0.6119 | 0.7753 | 0.3294 | 0.5683 | 0.2074 | 0.4 | 0.1285 | 0.3139 | 0.3013 | 0.4492 |
114
+ | 0.5692 | 42.0 | 4494 | 1.3361 | 0.3209 | 0.6257 | 0.2844 | 0.2785 | 0.2123 | 0.4655 | 0.3311 | 0.4922 | 0.5103 | 0.3317 | 0.3787 | 0.6923 | 0.6219 | 0.7802 | 0.3437 | 0.5767 | 0.1992 | 0.3897 | 0.1221 | 0.3347 | 0.3177 | 0.4704 |
115
+ | 0.5563 | 43.0 | 4601 | 1.2864 | 0.3284 | 0.6405 | 0.2969 | 0.2098 | 0.2261 | 0.4568 | 0.3312 | 0.5031 | 0.5202 | 0.2639 | 0.399 | 0.6864 | 0.6278 | 0.7821 | 0.3447 | 0.5733 | 0.2249 | 0.4186 | 0.1179 | 0.3486 | 0.327 | 0.4782 |
116
+ | 0.5581 | 44.0 | 4708 | 1.2884 | 0.3309 | 0.6319 | 0.3104 | 0.2022 | 0.2285 | 0.4627 | 0.337 | 0.5046 | 0.5237 | 0.268 | 0.4064 | 0.6992 | 0.6404 | 0.7944 | 0.353 | 0.595 | 0.2145 | 0.3877 | 0.1283 | 0.3639 | 0.3185 | 0.4777 |
117
+ | 0.5464 | 45.0 | 4815 | 1.3207 | 0.3205 | 0.6256 | 0.2849 | 0.1818 | 0.2114 | 0.4495 | 0.3295 | 0.493 | 0.5136 | 0.2564 | 0.3824 | 0.7016 | 0.6279 | 0.787 | 0.3335 | 0.5867 | 0.2226 | 0.4064 | 0.1144 | 0.3194 | 0.304 | 0.4687 |
118
+ | 0.5445 | 46.0 | 4922 | 1.2675 | 0.3266 | 0.6518 | 0.295 | 0.2526 | 0.2217 | 0.4655 | 0.3354 | 0.4991 | 0.5164 | 0.3 | 0.3932 | 0.6916 | 0.626 | 0.7883 | 0.3552 | 0.5817 | 0.2189 | 0.4054 | 0.1285 | 0.3347 | 0.3045 | 0.4721 |
119
+ | 0.5247 | 47.0 | 5029 | 1.3173 | 0.3311 | 0.6464 | 0.2924 | 0.2393 | 0.226 | 0.4541 | 0.339 | 0.4983 | 0.5182 | 0.2804 | 0.3948 | 0.6897 | 0.6356 | 0.784 | 0.3544 | 0.6 | 0.2171 | 0.4034 | 0.1408 | 0.3333 | 0.3077 | 0.4704 |
120
+ | 0.5302 | 48.0 | 5136 | 1.2731 | 0.326 | 0.631 | 0.2795 | 0.2521 | 0.2174 | 0.4665 | 0.3267 | 0.4931 | 0.5104 | 0.2953 | 0.3882 | 0.6879 | 0.6296 | 0.784 | 0.3588 | 0.585 | 0.1986 | 0.3961 | 0.1284 | 0.3333 | 0.3147 | 0.4536 |
121
+ | 0.5149 | 49.0 | 5243 | 1.2684 | 0.3152 | 0.6229 | 0.2801 | 0.2283 | 0.2075 | 0.4572 | 0.3264 | 0.4836 | 0.5022 | 0.281 | 0.3707 | 0.6804 | 0.6224 | 0.7772 | 0.3308 | 0.5433 | 0.2041 | 0.4078 | 0.1049 | 0.3153 | 0.3136 | 0.4676 |
122
+ | 0.5118 | 50.0 | 5350 | 1.3018 | 0.3252 | 0.6248 | 0.305 | 0.2196 | 0.2206 | 0.4821 | 0.3287 | 0.4858 | 0.5015 | 0.2654 | 0.3794 | 0.6771 | 0.6159 | 0.7691 | 0.3332 | 0.5717 | 0.2209 | 0.3961 | 0.1375 | 0.3167 | 0.3185 | 0.4542 |
123
+ | 0.502 | 51.0 | 5457 | 1.2466 | 0.3319 | 0.653 | 0.2901 | 0.2399 | 0.2178 | 0.4883 | 0.3388 | 0.4905 | 0.5081 | 0.289 | 0.3748 | 0.6816 | 0.626 | 0.7772 | 0.357 | 0.5783 | 0.2109 | 0.402 | 0.1552 | 0.3208 | 0.3103 | 0.462 |
124
+ | 0.506 | 52.0 | 5564 | 1.2553 | 0.3153 | 0.64 | 0.2721 | 0.24 | 0.2077 | 0.4769 | 0.3287 | 0.4818 | 0.4982 | 0.2784 | 0.372 | 0.6928 | 0.6264 | 0.766 | 0.3397 | 0.5717 | 0.2087 | 0.3956 | 0.1133 | 0.3111 | 0.2885 | 0.4464 |
125
+ | 0.5066 | 53.0 | 5671 | 1.3476 | 0.3352 | 0.6334 | 0.2955 | 0.2544 | 0.2323 | 0.4958 | 0.3383 | 0.4952 | 0.5163 | 0.3038 | 0.3849 | 0.7196 | 0.6251 | 0.7759 | 0.3453 | 0.5733 | 0.2273 | 0.4162 | 0.1552 | 0.3319 | 0.3231 | 0.4844 |
126
+ | 0.4992 | 54.0 | 5778 | 1.3008 | 0.3303 | 0.6458 | 0.292 | 0.1557 | 0.2268 | 0.4735 | 0.3312 | 0.4849 | 0.5011 | 0.228 | 0.3711 | 0.691 | 0.611 | 0.7673 | 0.3633 | 0.5567 | 0.2247 | 0.3995 | 0.1374 | 0.2986 | 0.3149 | 0.4832 |
127
+ | 0.4791 | 55.0 | 5885 | 1.3185 | 0.3348 | 0.6544 | 0.2884 | 0.2444 | 0.2309 | 0.4804 | 0.3387 | 0.4981 | 0.5153 | 0.2973 | 0.3873 | 0.7085 | 0.6284 | 0.7784 | 0.3575 | 0.595 | 0.2163 | 0.4034 | 0.1542 | 0.3278 | 0.3175 | 0.4721 |
128
+ | 0.4628 | 56.0 | 5992 | 1.2985 | 0.3266 | 0.6258 | 0.2912 | 0.216 | 0.2286 | 0.4531 | 0.3407 | 0.4845 | 0.5015 | 0.2562 | 0.3845 | 0.6729 | 0.6301 | 0.7747 | 0.3721 | 0.5833 | 0.2105 | 0.402 | 0.1221 | 0.3097 | 0.2983 | 0.438 |
129
+ | 0.4568 | 57.0 | 6099 | 1.2744 | 0.3368 | 0.6356 | 0.3091 | 0.2112 | 0.2331 | 0.4793 | 0.3421 | 0.4889 | 0.5086 | 0.2813 | 0.3778 | 0.691 | 0.6273 | 0.7741 | 0.3848 | 0.58 | 0.2022 | 0.4078 | 0.1421 | 0.2972 | 0.3276 | 0.4838 |
130
+ | 0.4508 | 58.0 | 6206 | 1.3367 | 0.3387 | 0.6541 | 0.3073 | 0.256 | 0.2365 | 0.4842 | 0.3444 | 0.4925 | 0.5096 | 0.3095 | 0.3798 | 0.6947 | 0.6259 | 0.7735 | 0.3822 | 0.5767 | 0.2121 | 0.4005 | 0.1487 | 0.3125 | 0.3246 | 0.4849 |
131
+ | 0.4476 | 59.0 | 6313 | 1.2988 | 0.3422 | 0.6574 | 0.3041 | 0.2575 | 0.2349 | 0.4833 | 0.3421 | 0.4973 | 0.5173 | 0.3087 | 0.3878 | 0.7027 | 0.6439 | 0.7858 | 0.3656 | 0.5683 | 0.239 | 0.4191 | 0.1374 | 0.3333 | 0.325 | 0.4799 |
132
+ | 0.4418 | 60.0 | 6420 | 1.3153 | 0.336 | 0.6532 | 0.3026 | 0.2298 | 0.2296 | 0.4988 | 0.342 | 0.4952 | 0.5178 | 0.2729 | 0.3987 | 0.6979 | 0.617 | 0.7735 | 0.3692 | 0.5767 | 0.2324 | 0.4152 | 0.1367 | 0.3347 | 0.3246 | 0.4888 |
133
+ | 0.4255 | 61.0 | 6527 | 1.3474 | 0.3351 | 0.6402 | 0.3107 | 0.2307 | 0.2303 | 0.4998 | 0.3483 | 0.5026 | 0.5188 | 0.2808 | 0.3929 | 0.7016 | 0.6216 | 0.7741 | 0.3898 | 0.5933 | 0.2099 | 0.3975 | 0.1265 | 0.3361 | 0.3277 | 0.4927 |
134
+ | 0.4398 | 62.0 | 6634 | 1.3079 | 0.3235 | 0.6414 | 0.2716 | 0.203 | 0.2249 | 0.4655 | 0.3377 | 0.4969 | 0.5139 | 0.2522 | 0.3896 | 0.691 | 0.6164 | 0.7716 | 0.3404 | 0.575 | 0.2371 | 0.4216 | 0.1347 | 0.3347 | 0.2889 | 0.4665 |
135
+ | 0.4373 | 63.0 | 6741 | 1.3848 | 0.3227 | 0.6411 | 0.2715 | 0.2586 | 0.2268 | 0.4554 | 0.338 | 0.4883 | 0.5056 | 0.2983 | 0.3867 | 0.6765 | 0.6107 | 0.7599 | 0.3369 | 0.59 | 0.2328 | 0.4044 | 0.1322 | 0.3153 | 0.3011 | 0.4587 |
136
+ | 0.4287 | 64.0 | 6848 | 1.3676 | 0.3218 | 0.6456 | 0.2789 | 0.2563 | 0.2225 | 0.4598 | 0.3365 | 0.4915 | 0.5088 | 0.3148 | 0.3826 | 0.6923 | 0.5985 | 0.7549 | 0.3578 | 0.5667 | 0.2206 | 0.4142 | 0.1304 | 0.3417 | 0.3018 | 0.4665 |
137
+ | 0.4085 | 65.0 | 6955 | 1.3785 | 0.3343 | 0.6465 | 0.2967 | 0.2321 | 0.2383 | 0.4732 | 0.3415 | 0.4994 | 0.514 | 0.2836 | 0.3928 | 0.6854 | 0.6048 | 0.763 | 0.3561 | 0.5817 | 0.2355 | 0.4078 | 0.1399 | 0.3319 | 0.335 | 0.4855 |
138
+ | 0.4018 | 66.0 | 7062 | 1.3817 | 0.3259 | 0.6478 | 0.279 | 0.2321 | 0.227 | 0.4848 | 0.3364 | 0.4897 | 0.5103 | 0.2796 | 0.3899 | 0.6871 | 0.6028 | 0.7605 | 0.3393 | 0.57 | 0.2203 | 0.4015 | 0.1491 | 0.3306 | 0.318 | 0.4888 |
139
+ | 0.4005 | 67.0 | 7169 | 1.3791 | 0.3305 | 0.6483 | 0.2948 | 0.2344 | 0.225 | 0.4871 | 0.3358 | 0.4895 | 0.5095 | 0.2826 | 0.3829 | 0.6944 | 0.6162 | 0.7654 | 0.3629 | 0.5683 | 0.2217 | 0.3941 | 0.1194 | 0.3222 | 0.3324 | 0.4972 |
140
+ | 0.4 | 68.0 | 7276 | 1.3844 | 0.3413 | 0.6686 | 0.2994 | 0.2306 | 0.2315 | 0.4953 | 0.3424 | 0.4996 | 0.5178 | 0.2897 | 0.3871 | 0.7112 | 0.618 | 0.7728 | 0.3626 | 0.58 | 0.2307 | 0.4137 | 0.1373 | 0.3208 | 0.3581 | 0.5017 |
141
+ | 0.3961 | 69.0 | 7383 | 1.3469 | 0.334 | 0.6535 | 0.2764 | 0.2806 | 0.2249 | 0.4906 | 0.3449 | 0.5058 | 0.5229 | 0.3374 | 0.3884 | 0.7273 | 0.6161 | 0.7778 | 0.3543 | 0.585 | 0.2291 | 0.4088 | 0.1308 | 0.3514 | 0.3396 | 0.4916 |
142
+ | 0.3817 | 70.0 | 7490 | 1.3834 | 0.328 | 0.6577 | 0.286 | 0.2902 | 0.2249 | 0.4676 | 0.3436 | 0.4968 | 0.5121 | 0.3332 | 0.3912 | 0.6866 | 0.6162 | 0.7593 | 0.3558 | 0.5717 | 0.2175 | 0.4093 | 0.1222 | 0.3361 | 0.3282 | 0.4844 |
143
+ | 0.3851 | 71.0 | 7597 | 1.3745 | 0.3268 | 0.6354 | 0.281 | 0.2392 | 0.2237 | 0.4644 | 0.3386 | 0.4965 | 0.5132 | 0.3088 | 0.3918 | 0.685 | 0.6184 | 0.7654 | 0.3537 | 0.575 | 0.2253 | 0.4039 | 0.1238 | 0.3528 | 0.313 | 0.4687 |
144
+ | 0.3773 | 72.0 | 7704 | 1.3953 | 0.3325 | 0.6475 | 0.2841 | 0.2436 | 0.2233 | 0.4887 | 0.3397 | 0.4968 | 0.5134 | 0.3069 | 0.3873 | 0.6961 | 0.6198 | 0.7673 | 0.3492 | 0.575 | 0.2159 | 0.4088 | 0.1404 | 0.325 | 0.3375 | 0.4911 |
145
+ | 0.3709 | 73.0 | 7811 | 1.3560 | 0.3299 | 0.6478 | 0.2891 | 0.2394 | 0.2246 | 0.4904 | 0.3415 | 0.4962 | 0.5133 | 0.2887 | 0.3893 | 0.6974 | 0.6232 | 0.7648 | 0.3428 | 0.5567 | 0.2255 | 0.4074 | 0.13 | 0.3444 | 0.3281 | 0.4933 |
146
+ | 0.386 | 74.0 | 7918 | 1.3967 | 0.3336 | 0.6619 | 0.2908 | 0.2852 | 0.23 | 0.4811 | 0.3439 | 0.4963 | 0.5149 | 0.3293 | 0.3951 | 0.6897 | 0.6098 | 0.7636 | 0.3737 | 0.5967 | 0.2245 | 0.401 | 0.1329 | 0.3319 | 0.3271 | 0.4816 |
147
+ | 0.3584 | 75.0 | 8025 | 1.3931 | 0.3342 | 0.6622 | 0.3032 | 0.2654 | 0.2288 | 0.4765 | 0.3417 | 0.495 | 0.513 | 0.3084 | 0.3815 | 0.7017 | 0.6155 | 0.7784 | 0.3649 | 0.57 | 0.2321 | 0.402 | 0.1249 | 0.3222 | 0.3336 | 0.4922 |
148
+ | 0.3481 | 76.0 | 8132 | 1.3925 | 0.3368 | 0.6585 | 0.2895 | 0.269 | 0.2329 | 0.4833 | 0.348 | 0.5001 | 0.5193 | 0.3074 | 0.3935 | 0.7015 | 0.6196 | 0.7821 | 0.3493 | 0.5783 | 0.2393 | 0.4118 | 0.1409 | 0.3292 | 0.3348 | 0.495 |
149
+ | 0.3512 | 77.0 | 8239 | 1.3984 | 0.3323 | 0.6513 | 0.2849 | 0.2895 | 0.2248 | 0.4827 | 0.3393 | 0.4967 | 0.5136 | 0.3289 | 0.382 | 0.7079 | 0.6188 | 0.7772 | 0.339 | 0.5783 | 0.2318 | 0.4074 | 0.1319 | 0.3208 | 0.3402 | 0.4844 |
150
+ | 0.3366 | 78.0 | 8346 | 1.4160 | 0.3414 | 0.6618 | 0.3016 | 0.263 | 0.2376 | 0.4876 | 0.3428 | 0.4978 | 0.5138 | 0.3062 | 0.3873 | 0.6903 | 0.6113 | 0.7704 | 0.3714 | 0.595 | 0.2483 | 0.4093 | 0.131 | 0.3056 | 0.3449 | 0.4888 |
151
+ | 0.3278 | 79.0 | 8453 | 1.4257 | 0.3367 | 0.6401 | 0.3062 | 0.2399 | 0.2326 | 0.4775 | 0.3408 | 0.4939 | 0.5115 | 0.2817 | 0.3838 | 0.6977 | 0.6067 | 0.771 | 0.3648 | 0.5717 | 0.2445 | 0.4108 | 0.1211 | 0.3069 | 0.3463 | 0.4972 |
152
+ | 0.3225 | 80.0 | 8560 | 1.3995 | 0.3355 | 0.6592 | 0.2994 | 0.2158 | 0.2357 | 0.4778 | 0.3447 | 0.496 | 0.5105 | 0.2617 | 0.3863 | 0.6889 | 0.6033 | 0.7562 | 0.3597 | 0.5817 | 0.2395 | 0.4039 | 0.1327 | 0.3153 | 0.3423 | 0.4955 |
153
+ | 0.3197 | 81.0 | 8667 | 1.3828 | 0.3368 | 0.6525 | 0.3008 | 0.239 | 0.2342 | 0.48 | 0.3525 | 0.503 | 0.5196 | 0.2863 | 0.3951 | 0.6975 | 0.6113 | 0.7735 | 0.3803 | 0.5817 | 0.2268 | 0.4029 | 0.1239 | 0.3347 | 0.3415 | 0.505 |
154
+ | 0.3119 | 82.0 | 8774 | 1.3821 | 0.3367 | 0.6504 | 0.313 | 0.2674 | 0.2299 | 0.4826 | 0.3486 | 0.4961 | 0.5121 | 0.309 | 0.3872 | 0.692 | 0.6122 | 0.763 | 0.3691 | 0.58 | 0.2295 | 0.4108 | 0.1337 | 0.3097 | 0.3391 | 0.4972 |
155
+ | 0.3022 | 83.0 | 8881 | 1.4340 | 0.3378 | 0.6458 | 0.2983 | 0.2439 | 0.2336 | 0.4668 | 0.3417 | 0.4952 | 0.5138 | 0.2866 | 0.3936 | 0.6793 | 0.6111 | 0.7636 | 0.3687 | 0.5783 | 0.2383 | 0.4206 | 0.1301 | 0.3139 | 0.341 | 0.4927 |
156
+ | 0.3011 | 84.0 | 8988 | 1.4571 | 0.3335 | 0.6497 | 0.2893 | 0.2644 | 0.2254 | 0.4719 | 0.3399 | 0.4901 | 0.5069 | 0.3052 | 0.3811 | 0.6801 | 0.6158 | 0.7654 | 0.3622 | 0.5783 | 0.2278 | 0.4029 | 0.1355 | 0.3069 | 0.3261 | 0.481 |
157
+ | 0.2972 | 85.0 | 9095 | 1.4258 | 0.3338 | 0.6461 | 0.2916 | 0.2397 | 0.2283 | 0.4751 | 0.3449 | 0.499 | 0.516 | 0.2907 | 0.3911 | 0.6938 | 0.606 | 0.7574 | 0.3745 | 0.6017 | 0.2265 | 0.4025 | 0.1277 | 0.3264 | 0.3343 | 0.4922 |
158
+ | 0.2859 | 86.0 | 9202 | 1.4684 | 0.329 | 0.6399 | 0.2879 | 0.2591 | 0.2221 | 0.4732 | 0.3452 | 0.4957 | 0.5163 | 0.3076 | 0.3911 | 0.6931 | 0.6055 | 0.766 | 0.3602 | 0.5983 | 0.2173 | 0.3936 | 0.1339 | 0.3306 | 0.328 | 0.4927 |
159
+ | 0.2921 | 87.0 | 9309 | 1.4191 | 0.3332 | 0.646 | 0.2982 | 0.2655 | 0.2265 | 0.477 | 0.3415 | 0.5005 | 0.5196 | 0.3141 | 0.3895 | 0.7048 | 0.6053 | 0.7679 | 0.3804 | 0.6133 | 0.2223 | 0.402 | 0.1294 | 0.3278 | 0.3286 | 0.4872 |
160
+ | 0.2788 | 88.0 | 9416 | 1.4109 | 0.3327 | 0.6484 | 0.2959 | 0.2407 | 0.2284 | 0.4755 | 0.3454 | 0.498 | 0.5162 | 0.2875 | 0.3884 | 0.7014 | 0.6128 | 0.771 | 0.3555 | 0.585 | 0.2313 | 0.4025 | 0.1274 | 0.3333 | 0.3366 | 0.4894 |
161
+ | 0.2808 | 89.0 | 9523 | 1.4585 | 0.3333 | 0.6453 | 0.3076 | 0.2643 | 0.2279 | 0.4756 | 0.3423 | 0.4977 | 0.5168 | 0.3141 | 0.388 | 0.6946 | 0.6058 | 0.7673 | 0.3719 | 0.5967 | 0.2322 | 0.4118 | 0.1281 | 0.3139 | 0.3286 | 0.4944 |
162
+ | 0.2747 | 90.0 | 9630 | 1.4490 | 0.3338 | 0.6433 | 0.2976 | 0.2402 | 0.2257 | 0.4754 | 0.3455 | 0.4997 | 0.5175 | 0.2859 | 0.3942 | 0.6893 | 0.6087 | 0.7667 | 0.3793 | 0.595 | 0.2274 | 0.4083 | 0.1186 | 0.3264 | 0.3347 | 0.4911 |
163
+ | 0.2528 | 91.0 | 9737 | 1.4493 | 0.3362 | 0.6504 | 0.2926 | 0.2687 | 0.2288 | 0.4798 | 0.342 | 0.5006 | 0.5198 | 0.3141 | 0.3965 | 0.6867 | 0.6044 | 0.7704 | 0.389 | 0.6 | 0.2308 | 0.4103 | 0.1191 | 0.3222 | 0.3375 | 0.4961 |
164
+ | 0.2593 | 92.0 | 9844 | 1.4320 | 0.334 | 0.6486 | 0.2993 | 0.2461 | 0.2263 | 0.4702 | 0.3423 | 0.4986 | 0.517 | 0.2961 | 0.3884 | 0.6883 | 0.6089 | 0.7679 | 0.3741 | 0.5917 | 0.2337 | 0.4078 | 0.1149 | 0.3208 | 0.3382 | 0.4966 |
165
+ | 0.2685 | 93.0 | 9951 | 1.4475 | 0.3357 | 0.6478 | 0.2992 | 0.2672 | 0.2258 | 0.4738 | 0.3425 | 0.4978 | 0.5165 | 0.3123 | 0.3859 | 0.7037 | 0.6143 | 0.771 | 0.3774 | 0.5883 | 0.2311 | 0.4132 | 0.1173 | 0.325 | 0.3386 | 0.4849 |
166
+ | 0.2618 | 94.0 | 10058 | 1.4451 | 0.3385 | 0.6593 | 0.2988 | 0.2673 | 0.2324 | 0.4768 | 0.3457 | 0.5009 | 0.519 | 0.316 | 0.3898 | 0.6985 | 0.6104 | 0.7716 | 0.387 | 0.5967 | 0.2296 | 0.4039 | 0.1281 | 0.3278 | 0.3373 | 0.495 |
167
+ | 0.2513 | 95.0 | 10165 | 1.4426 | 0.3403 | 0.6552 | 0.313 | 0.2645 | 0.2336 | 0.4795 | 0.3429 | 0.5006 | 0.5179 | 0.3109 | 0.391 | 0.6934 | 0.6134 | 0.7735 | 0.3953 | 0.595 | 0.2311 | 0.4025 | 0.1209 | 0.3278 | 0.3408 | 0.4911 |
168
+ | 0.2596 | 96.0 | 10272 | 1.4438 | 0.338 | 0.6557 | 0.3033 | 0.2669 | 0.2288 | 0.4786 | 0.344 | 0.5005 | 0.5189 | 0.317 | 0.3915 | 0.6914 | 0.6119 | 0.7722 | 0.3964 | 0.595 | 0.2265 | 0.4054 | 0.1177 | 0.3347 | 0.3374 | 0.4872 |
169
+ | 0.2363 | 97.0 | 10379 | 1.4447 | 0.3379 | 0.6526 | 0.3044 | 0.2687 | 0.2297 | 0.4771 | 0.3437 | 0.5013 | 0.5196 | 0.32 | 0.3893 | 0.6969 | 0.608 | 0.7735 | 0.3861 | 0.5917 | 0.2335 | 0.4083 | 0.122 | 0.3319 | 0.3396 | 0.4927 |
170
+ | 0.2346 | 98.0 | 10486 | 1.4613 | 0.3366 | 0.6512 | 0.299 | 0.267 | 0.2288 | 0.4809 | 0.3425 | 0.5006 | 0.5201 | 0.3166 | 0.391 | 0.6999 | 0.6083 | 0.7722 | 0.3887 | 0.5933 | 0.2285 | 0.4088 | 0.1186 | 0.3319 | 0.3388 | 0.4944 |
171
+ | 0.2452 | 99.0 | 10593 | 1.4607 | 0.3362 | 0.6498 | 0.3001 | 0.2676 | 0.2286 | 0.4805 | 0.344 | 0.4982 | 0.5179 | 0.3168 | 0.3889 | 0.6997 | 0.6076 | 0.7716 | 0.3863 | 0.585 | 0.2264 | 0.4049 | 0.124 | 0.3347 | 0.3368 | 0.4933 |
172
+ | 0.2287 | 100.0 | 10700 | 1.4674 | 0.3363 | 0.6506 | 0.2992 | 0.2695 | 0.2282 | 0.4791 | 0.3441 | 0.4988 | 0.5186 | 0.3192 | 0.3884 | 0.6982 | 0.607 | 0.7716 | 0.3854 | 0.5883 | 0.2283 | 0.4093 | 0.1228 | 0.3319 | 0.3379 | 0.4916 |
173
+
174
+
175
+ ### Framework versions
176
+
177
+ - Transformers 4.41.0.dev0
178
+ - PyTorch 1.13.0+cu117
179
+ - Datasets 2.18.0
180
+ - Tokenizers 0.19.0
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 100.0,
3
+ "total_flos": 5.80084344142848e+16,
4
+ "train_loss": 1.202735595703125,
5
+ "train_runtime": 44.9423,
6
+ "train_samples_per_second": 6.675,
7
+ "train_steps_per_second": 2.225
8
+ }
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "hustvl/yolos-small",
3
+ "architectures": [
4
+ "YolosForObjectDetection"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "auxiliary_loss": false,
8
+ "bbox_cost": 5,
9
+ "bbox_loss_coefficient": 5,
10
+ "class_cost": 1,
11
+ "eos_coefficient": 0.1,
12
+ "giou_cost": 2,
13
+ "giou_loss_coefficient": 2,
14
+ "hidden_act": "gelu",
15
+ "hidden_dropout_prob": 0.0,
16
+ "hidden_size": 384,
17
+ "id2label": {
18
+ "0": "Coverall",
19
+ "1": "Face_Shield",
20
+ "2": "Gloves",
21
+ "3": "Goggles",
22
+ "4": "Mask"
23
+ },
24
+ "image_size": [
25
+ 512,
26
+ 864
27
+ ],
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 1536,
30
+ "label2id": {
31
+ "Coverall": 0,
32
+ "Face_Shield": 1,
33
+ "Gloves": 2,
34
+ "Goggles": 3,
35
+ "Mask": 4
36
+ },
37
+ "layer_norm_eps": 1e-12,
38
+ "model_type": "yolos",
39
+ "num_attention_heads": 6,
40
+ "num_channels": 3,
41
+ "num_detection_tokens": 100,
42
+ "num_hidden_layers": 12,
43
+ "patch_size": 16,
44
+ "qkv_bias": true,
45
+ "torch_dtype": "float32",
46
+ "transformers_version": "4.41.0.dev0",
47
+ "use_mid_position_embeddings": true
48
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a5f538837dc09ea2712d6f8bfc3262f561167fd8e1d3ed9841a5218d529e2ad
3
+ size 122630832
preprocessor_config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_valid_processor_keys": [
3
+ "images",
4
+ "annotations",
5
+ "return_segmentation_masks",
6
+ "masks_path",
7
+ "do_resize",
8
+ "size",
9
+ "resample",
10
+ "do_rescale",
11
+ "rescale_factor",
12
+ "do_normalize",
13
+ "image_mean",
14
+ "image_std",
15
+ "do_convert_annotations",
16
+ "do_pad",
17
+ "format",
18
+ "return_tensors",
19
+ "data_format",
20
+ "input_data_format"
21
+ ],
22
+ "do_convert_annotations": true,
23
+ "do_normalize": true,
24
+ "do_pad": true,
25
+ "do_rescale": true,
26
+ "do_resize": true,
27
+ "format": "coco_detection",
28
+ "image_mean": [
29
+ 0.485,
30
+ 0.456,
31
+ 0.406
32
+ ],
33
+ "image_processor_type": "YolosImageProcessor",
34
+ "image_std": [
35
+ 0.229,
36
+ 0.224,
37
+ 0.225
38
+ ],
39
+ "resample": 2,
40
+ "rescale_factor": 0.00392156862745098,
41
+ "size": {
42
+ "longest_edge": 600,
43
+ "shortest_edge": 600
44
+ }
45
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 100.0,
3
+ "total_flos": 5.80084344142848e+16,
4
+ "train_loss": 1.202735595703125,
5
+ "train_runtime": 44.9423,
6
+ "train_samples_per_second": 6.675,
7
+ "train_steps_per_second": 2.225
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 100.0,
5
+ "eval_steps": 500,
6
+ "global_step": 100,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 100.0,
13
+ "step": 100,
14
+ "total_flos": 5.80084344142848e+16,
15
+ "train_loss": 1.202735595703125,
16
+ "train_runtime": 44.9423,
17
+ "train_samples_per_second": 6.675,
18
+ "train_steps_per_second": 2.225
19
+ }
20
+ ],
21
+ "logging_steps": 500,
22
+ "max_steps": 100,
23
+ "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 100,
25
+ "save_steps": 500,
26
+ "total_flos": 5.80084344142848e+16,
27
+ "train_batch_size": 3,
28
+ "trial_name": null,
29
+ "trial_params": null
30
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae4d318227fded1d565ca310ab7c380889a2d992f50d4ed663b317ad432b3eb9
3
+ size 4731