Spaces:

hujiecpp
/

PE3R

Running on Zero

App Files Files Community

hujiecpp committed on Feb 21

Commit

89fb9c8

1 Parent(s): 6cbef76

init project

Browse files

Files changed (1) hide show

app.py +25 -22

app.py CHANGED Viewed

@@ -542,36 +542,39 @@ def get_reconstructed_scene(outdir, filelist, schedule, niter, min_conf_thr,
     outfile = get_3D_model_from_scene(outdir, scene, min_conf_thr, as_pointcloud, mask_sky,
                                       clean_depth, transparent_cams, cam_size)
     scene.to('cpu')
     torch.cuda.empty_cache()
     return scene, outfile
 # @spaces.GPU(duration=60)
-def get_3D_object_from_scene(outdir, text, threshold, scene, min_conf_thr, as_pointcloud,
-                 mask_sky, clean_depth, transparent_cams, cam_size):
-    device = 'cuda' if torch.cuda.is_available() else 'cpu'
-    siglip_tokenizer = AutoTokenizer.from_pretrained("google/siglip-large-patch16-256")
-    siglip = AutoModel.from_pretrained("google/siglip-large-patch16-256", device_map=device)
-    texts = [text]
-    inputs = siglip_tokenizer(text=texts, padding="max_length", return_tensors="pt")
-    inputs = {key: value.to(device) for key, value in inputs.items()}
-    with torch.no_grad():
-        text_feats =siglip.get_text_features(**inputs)
-        text_feats = text_feats / text_feats.norm(dim=-1, keepdim=True)
-    scene.render_image(text_feats, threshold)
-    scene.ori_imgs = scene.rendered_imgs
-    outfile = get_3D_model_from_scene(outdir, scene, min_conf_thr, as_pointcloud, mask_sky,
-                                      clean_depth, transparent_cams, cam_size)
-    return outfile
 with tempfile.TemporaryDirectory(suffix='pe3r_gradio_demo') as tmpdirname:
     recon_fun = functools.partial(get_reconstructed_scene, tmpdirname)
     # model_from_scene_fun = functools.partial(get_3D_model_from_scene, tmpdirname)
-    get_3D_object_from_scene_fun = functools.partial(get_3D_object_from_scene, tmpdirname)
     with gradio.Blocks(css=""".gradio-container {margin: 0 !important; min-width: 100%};""", title="PE3R Demo") as demo:
         # scene state is saved so that you can change conf_thr, cam_size... without rerunning the inference
@@ -626,8 +629,8 @@ with tempfile.TemporaryDirectory(suffix='pe3r_gradio_demo') as tmpdirname:
                                     scenegraph_type, winsize, refid],
                             outputs=[scene, outmodel]) # , outgallery
-            find_btn.click(fn=get_3D_object_from_scene_fun,
-                                inputs=[text_input, threshold, scene, min_conf_thr, as_pointcloud, mask_sky,
-                                        clean_depth, transparent_cams, cam_size],
-                            outputs=outmodel)
     demo.launch(show_error=True, share=None, server_name=None, server_port=None)

     outfile = get_3D_model_from_scene(outdir, scene, min_conf_thr, as_pointcloud, mask_sky,
                                       clean_depth, transparent_cams, cam_size)
+    print(scene)
     scene.to('cpu')
+    print(scene)
     torch.cuda.empty_cache()
     return scene, outfile
 # @spaces.GPU(duration=60)
+# def get_3D_object_from_scene(outdir, text, threshold, scene, min_conf_thr, as_pointcloud,
+#                  mask_sky, clean_depth, transparent_cams, cam_size):
+#     device = 'cuda' if torch.cuda.is_available() else 'cpu'
+#     siglip_tokenizer = AutoTokenizer.from_pretrained("google/siglip-large-patch16-256")
+#     siglip = AutoModel.from_pretrained("google/siglip-large-patch16-256", device_map=device)
+#     texts = [text]
+#     inputs = siglip_tokenizer(text=texts, padding="max_length", return_tensors="pt")
+#     inputs = {key: value.to(device) for key, value in inputs.items()}
+#     with torch.no_grad():
+#         text_feats =siglip.get_text_features(**inputs)
+#         text_feats = text_feats / text_feats.norm(dim=-1, keepdim=True)
+#     scene.render_image(text_feats, threshold)
+#     scene.ori_imgs = scene.rendered_imgs
+#     outfile = get_3D_model_from_scene(outdir, scene, min_conf_thr, as_pointcloud, mask_sky,
+#                                       clean_depth, transparent_cams, cam_size)
+#     return outfile
 with tempfile.TemporaryDirectory(suffix='pe3r_gradio_demo') as tmpdirname:
     recon_fun = functools.partial(get_reconstructed_scene, tmpdirname)
     # model_from_scene_fun = functools.partial(get_3D_model_from_scene, tmpdirname)
+    # get_3D_object_from_scene_fun = functools.partial(get_3D_object_from_scene, tmpdirname)
     with gradio.Blocks(css=""".gradio-container {margin: 0 !important; min-width: 100%};""", title="PE3R Demo") as demo:
         # scene state is saved so that you can change conf_thr, cam_size... without rerunning the inference
                                     scenegraph_type, winsize, refid],
                             outputs=[scene, outmodel]) # , outgallery
+            # find_btn.click(fn=get_3D_object_from_scene_fun,
+            #                     inputs=[text_input, threshold, scene, min_conf_thr, as_pointcloud, mask_sky,
+            #                             clean_depth, transparent_cams, cam_size],
+            #                 outputs=outmodel)
     demo.launch(show_error=True, share=None, server_name=None, server_port=None)