Jie Hu committed on
Commit
23c29a5
·
1 Parent(s): 9fdf8bc

init project

Browse files
Files changed (3) hide show
  1. .DS_Store +0 -0
  2. modules/.DS_Store +0 -0
  3. modules/pe3r/models.py +32 -32
.DS_Store ADDED
Binary file (6.15 kB). View file
 
modules/.DS_Store ADDED
Binary file (8.2 kB). View file
 
modules/pe3r/models.py CHANGED
@@ -18,35 +18,35 @@ class Models:
18
  MAST3R_CKP = 'naver/MASt3R_ViTLarge_BaseDecoder_512_catmlpdpt_metric'
19
  self.mast3r = AsymmetricMASt3R.from_pretrained(MAST3R_CKP).to(device)
20
 
21
- # -- sam2 --
22
- # SAM2_CKP = "./checkpoints/sam2.1_hiera_large.pt"
23
- # SAM2_CKP = 'hujiecpp/sam2-1-hiera-large'
24
- # SAM2_CONFIG = "./configs/sam2.1/sam2.1_hiera_l.yaml"
25
- # self.sam2 = build_sam2_video_predictor(SAM2_CONFIG, SAM2_CKP, device=device, apply_postprocessing=False)
26
- # self.sam2.eval()
27
- self.sam2 = SAM2VideoPredictor.from_pretrained('facebook/sam2.1-hiera-large', device=device)
28
-
29
- # -- mobilesamv2 & sam1 --
30
- # SAM1_ENCODER_CKP = './checkpoints/sam_vit_h.pt'
31
- # SAM1_ENCODER_CKP = 'facebook/sam-vit-huge/model.safetensors'
32
- SAM1_DECODER_CKP = './checkpoints/Prompt_guided_Mask_Decoder.pt'
33
- self.mobilesamv2 = sam_model_registry['sam_vit_h'](None)
34
- # image_encoder=sam_model_registry['sam_vit_h_encoder'](SAM1_ENCODER_CKP)
35
- sam1 = SamModel.from_pretrained('facebook/sam-vit-huge')
36
- image_encoder = sam1.vision_encoder
37
-
38
- prompt_encoder, mask_decoder = sam_model_registry['prompt_guided_decoder'](SAM1_DECODER_CKP)
39
- self.mobilesamv2.prompt_encoder = prompt_encoder
40
- self.mobilesamv2.mask_decoder = mask_decoder
41
- self.mobilesamv2.image_encoder=image_encoder
42
- self.mobilesamv2.to(device=device)
43
- self.mobilesamv2.eval()
44
-
45
- # -- yolov8 --
46
- YOLO8_CKP='./checkpoints/ObjectAwareModel.pt'
47
- self.yolov8 = ObjectAwareModel(YOLO8_CKP)
48
-
49
- # -- siglip --
50
- self.siglip = AutoModel.from_pretrained("google/siglip-large-patch16-256", device_map=device)
51
- self.siglip_tokenizer = AutoTokenizer.from_pretrained("google/siglip-large-patch16-256", device_map=device)
52
- self.siglip_processor = AutoProcessor.from_pretrained("google/siglip-large-patch16-256", device_map=device)
 
18
  MAST3R_CKP = 'naver/MASt3R_ViTLarge_BaseDecoder_512_catmlpdpt_metric'
19
  self.mast3r = AsymmetricMASt3R.from_pretrained(MAST3R_CKP).to(device)
20
 
21
+ # # -- sam2 --
22
+ # # SAM2_CKP = "./checkpoints/sam2.1_hiera_large.pt"
23
+ # # SAM2_CKP = 'hujiecpp/sam2-1-hiera-large'
24
+ # # SAM2_CONFIG = "./configs/sam2.1/sam2.1_hiera_l.yaml"
25
+ # # self.sam2 = build_sam2_video_predictor(SAM2_CONFIG, SAM2_CKP, device=device, apply_postprocessing=False)
26
+ # # self.sam2.eval()
27
+ # self.sam2 = SAM2VideoPredictor.from_pretrained('facebook/sam2.1-hiera-large', device=device)
28
+
29
+ # # -- mobilesamv2 & sam1 --
30
+ # # SAM1_ENCODER_CKP = './checkpoints/sam_vit_h.pt'
31
+ # # SAM1_ENCODER_CKP = 'facebook/sam-vit-huge/model.safetensors'
32
+ # SAM1_DECODER_CKP = './checkpoints/Prompt_guided_Mask_Decoder.pt'
33
+ # self.mobilesamv2 = sam_model_registry['sam_vit_h'](None)
34
+ # # image_encoder=sam_model_registry['sam_vit_h_encoder'](SAM1_ENCODER_CKP)
35
+ # sam1 = SamModel.from_pretrained('facebook/sam-vit-huge')
36
+ # image_encoder = sam1.vision_encoder
37
+
38
+ # prompt_encoder, mask_decoder = sam_model_registry['prompt_guided_decoder'](SAM1_DECODER_CKP)
39
+ # self.mobilesamv2.prompt_encoder = prompt_encoder
40
+ # self.mobilesamv2.mask_decoder = mask_decoder
41
+ # self.mobilesamv2.image_encoder=image_encoder
42
+ # self.mobilesamv2.to(device=device)
43
+ # self.mobilesamv2.eval()
44
+
45
+ # # -- yolov8 --
46
+ # YOLO8_CKP='./checkpoints/ObjectAwareModel.pt'
47
+ # self.yolov8 = ObjectAwareModel(YOLO8_CKP)
48
+
49
+ # # -- siglip --
50
+ # self.siglip = AutoModel.from_pretrained("google/siglip-large-patch16-256", device_map=device)
51
+ # self.siglip_tokenizer = AutoTokenizer.from_pretrained("google/siglip-large-patch16-256", device_map=device)
52
+ # self.siglip_processor = AutoProcessor.from_pretrained("google/siglip-large-patch16-256", device_map=device)