frankers3 committed on
Commit
36efa90
1 Parent(s): f6b5d4c

Training in progress, step 200

Browse files
Files changed (5) hide show
  1. README.md +5 -5
  2. config.json +11 -16
  3. model.safetensors +2 -2
  4. preprocessor_config.json +1 -1
  5. training_args.bin +1 -1
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: apache-2.0
3
- base_model: SenseTime/deformable-detr
4
  tags:
5
  - generated_from_trainer
6
  model-index:
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # detr
15
 
16
- This model is a fine-tuned version of [SenseTime/deformable-detr](https://huggingface.co/SenseTime/deformable-detr) on the None dataset.
17
 
18
  ## Model description
19
 
@@ -38,7 +38,7 @@ The following hyperparameters were used during training:
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
- - num_epochs: 15
42
  - mixed_precision_training: Native AMP
43
 
44
  ### Training results
@@ -47,7 +47,7 @@ The following hyperparameters were used during training:
47
 
48
  ### Framework versions
49
 
50
- - Transformers 4.38.2
51
  - Pytorch 2.2.1+cu121
52
- - Datasets 2.18.0
53
  - Tokenizers 0.15.2
 
1
  ---
2
  license: apache-2.0
3
+ base_model: facebook/detr-resnet-50
4
  tags:
5
  - generated_from_trainer
6
  model-index:
 
13
 
14
  # detr
15
 
16
+ This model is a fine-tuned version of [facebook/detr-resnet-50](https://huggingface.co/facebook/detr-resnet-50) on the None dataset.
17
 
18
  ## Model description
19
 
 
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 20
42
  - mixed_precision_training: Native AMP
43
 
44
  ### Training results
 
47
 
48
  ### Framework versions
49
 
50
+ - Transformers 4.38.1
51
  - Pytorch 2.2.1+cu121
52
+ - Datasets 2.17.1
53
  - Tokenizers 0.15.2
config.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "_name_or_path": "SenseTime/deformable-detr",
3
  "activation_dropout": 0.0,
4
  "activation_function": "relu",
5
  "architectures": [
6
- "DeformableDetrForObjectDetection"
7
  ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": false,
@@ -13,23 +13,20 @@
13
  "bbox_cost": 5,
14
  "bbox_loss_coefficient": 5,
15
  "class_cost": 1,
 
16
  "d_model": 256,
17
  "decoder_attention_heads": 8,
18
- "decoder_ffn_dim": 1024,
19
  "decoder_layerdrop": 0.0,
20
  "decoder_layers": 6,
21
- "decoder_n_points": 4,
22
  "dice_loss_coefficient": 1,
23
  "dilation": false,
24
- "disable_custom_kernels": false,
25
  "dropout": 0.1,
26
  "encoder_attention_heads": 8,
27
- "encoder_ffn_dim": 1024,
28
  "encoder_layerdrop": 0.0,
29
  "encoder_layers": 6,
30
- "encoder_n_points": 4,
31
  "eos_coefficient": 0.1,
32
- "focal_alpha": 0.25,
33
  "giou_cost": 2,
34
  "giou_loss_coefficient": 2,
35
  "id2label": {
@@ -43,16 +40,14 @@
43
  },
44
  "mask_loss_coefficient": 1,
45
  "max_position_embeddings": 1024,
46
- "model_type": "deformable_detr",
47
  "num_channels": 3,
48
- "num_feature_levels": 4,
49
- "num_queries": 300,
50
  "position_embedding_type": "sine",
 
51
  "torch_dtype": "float32",
52
- "transformers_version": "4.38.2",
53
- "two_stage": false,
54
- "two_stage_num_proposals": 300,
55
  "use_pretrained_backbone": true,
56
- "use_timm_backbone": true,
57
- "with_box_refine": false
58
  }
 
1
  {
2
+ "_name_or_path": "facebook/detr-resnet-50",
3
  "activation_dropout": 0.0,
4
  "activation_function": "relu",
5
  "architectures": [
6
+ "DetrForObjectDetection"
7
  ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": false,
 
13
  "bbox_cost": 5,
14
  "bbox_loss_coefficient": 5,
15
  "class_cost": 1,
16
+ "classifier_dropout": 0.0,
17
  "d_model": 256,
18
  "decoder_attention_heads": 8,
19
+ "decoder_ffn_dim": 2048,
20
  "decoder_layerdrop": 0.0,
21
  "decoder_layers": 6,
 
22
  "dice_loss_coefficient": 1,
23
  "dilation": false,
 
24
  "dropout": 0.1,
25
  "encoder_attention_heads": 8,
26
+ "encoder_ffn_dim": 2048,
27
  "encoder_layerdrop": 0.0,
28
  "encoder_layers": 6,
 
29
  "eos_coefficient": 0.1,
 
30
  "giou_cost": 2,
31
  "giou_loss_coefficient": 2,
32
  "id2label": {
 
40
  },
41
  "mask_loss_coefficient": 1,
42
  "max_position_embeddings": 1024,
43
+ "model_type": "detr",
44
  "num_channels": 3,
45
+ "num_hidden_layers": 6,
46
+ "num_queries": 150,
47
  "position_embedding_type": "sine",
48
+ "scale_embedding": false,
49
  "torch_dtype": "float32",
50
+ "transformers_version": "4.38.1",
 
 
51
  "use_pretrained_backbone": true,
52
+ "use_timm_backbone": true
 
53
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:511243e3fc69b8a971865ffd71b042f08fcc0bcfc65714942640983896e8724b
3
- size 160676460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2c3f006aa8d99951bc725eeac437f5c25d93a93aab07ad4b43f5939cd1655c9
3
+ size 166546024
preprocessor_config.json CHANGED
@@ -10,7 +10,7 @@
10
  0.456,
11
  0.406
12
  ],
13
- "image_processor_type": "DeformableDetrImageProcessor",
14
  "image_std": [
15
  0.229,
16
  0.224,
 
10
  0.456,
11
  0.406
12
  ],
13
+ "image_processor_type": "DetrImageProcessor",
14
  "image_std": [
15
  0.229,
16
  0.224,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b93bbc9d246d3cab23e8ec1e4fd3b7d7076041f54d586188dd75f21fdb9289bf
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6eb9b88d2bec2c45b07ccd100f7ffc91323aefe2611c9395f2361133829b4d9
3
  size 4856