Initial commit
Browse files
- README.md +2 -2
- sam2_hiera_l.yaml → sam2.1_hiera_l.yaml +5 -2
- sam2.1_hiera_large.pt +2 -2
README.md
CHANGED
@@ -42,7 +42,7 @@ with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16):
|
|
42 |
...
|
43 |
```
|
44 |
|
45 |
-
Refer to the [demo notebooks](https://github.com/facebookresearch/segment-anything-2/tree/main/notebooks) for details.
|
46 |
|
47 |
### Citation
|
48 |
|
@@ -55,4 +55,4 @@ To cite the paper, model, or software, please use the below:
|
|
55 |
url={https://arxiv.org/abs/2408.00714},
|
56 |
year={2024}
|
57 |
}
|
58 |
-
```
|
|
|
42 |
...
|
43 |
```
|
44 |
|
45 |
+
Refer to the [demo notebooks](https://github.com/facebookresearch/segment-anything-2/tree/main/notebooks) for more details.
|
46 |
|
47 |
### Citation
|
48 |
|
|
|
55 |
url={https://arxiv.org/abs/2408.00714},
|
56 |
year={2024}
|
57 |
}
|
58 |
+
```
|
sam2_hiera_l.yaml → sam2.1_hiera_l.yaml
RENAMED
@@ -93,6 +93,7 @@ model:
|
|
93 |
use_mask_input_as_output_without_sam: true
|
94 |
# Memory
|
95 |
directly_add_no_mem_embed: true
|
|
|
96 |
# use high-resolution feature map in the SAM mask decoder
|
97 |
use_high_res_features_in_sam: true
|
98 |
# output 3 masks on the first click on initial conditioning frames
|
@@ -101,7 +102,9 @@ model:
|
|
101 |
iou_prediction_use_sigmoid: True
|
102 |
# cross-attend to object pointers from other frames (based on SAM output tokens) in the encoder
|
103 |
use_obj_ptrs_in_encoder: true
|
104 |
-
add_tpos_enc_to_obj_ptrs: false
|
|
|
|
|
105 |
only_obj_ptrs_in_the_past_for_eval: true
|
106 |
# object occlusion prediction
|
107 |
pred_obj_scores: true
|
@@ -114,4 +117,4 @@ model:
|
|
114 |
multimask_max_pt_num: 1
|
115 |
use_mlp_for_obj_ptr_proj: true
|
116 |
# Compilation flag
|
117 |
-
compile_image_encoder: False
|
|
|
93 |
use_mask_input_as_output_without_sam: true
|
94 |
# Memory
|
95 |
directly_add_no_mem_embed: true
|
96 |
+
no_obj_embed_spatial: true
|
97 |
# use high-resolution feature map in the SAM mask decoder
|
98 |
use_high_res_features_in_sam: true
|
99 |
# output 3 masks on the first click on initial conditioning frames
|
|
|
102 |
iou_prediction_use_sigmoid: True
|
103 |
# cross-attend to object pointers from other frames (based on SAM output tokens) in the encoder
|
104 |
use_obj_ptrs_in_encoder: true
|
105 |
+
add_tpos_enc_to_obj_ptrs: true
|
106 |
+
proj_tpos_enc_in_obj_ptrs: true
|
107 |
+
use_signed_tpos_enc_to_obj_ptrs: true
|
108 |
only_obj_ptrs_in_the_past_for_eval: true
|
109 |
# object occlusion prediction
|
110 |
pred_obj_scores: true
|
|
|
117 |
multimask_max_pt_num: 1
|
118 |
use_mlp_for_obj_ptr_proj: true
|
119 |
# Compilation flag
|
120 |
+
compile_image_encoder: False
|
sam2.1_hiera_large.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2647878d5dfa5098f2f8649825738a9345572bae2d4350a2468587ece47dd318
|
3 |
+
size 898083611
|