Spaces:

facebook
/

vggsfm

Running on Zero

App Files Files Community

JianyuanWang committed on Jun 26

Commit

34d287c

•

1 Parent(s): 8866a87

push

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

app.py +156 -46
debug_demo.py +31 -0
glbscene.glb +0 -0
requirements.txt +1 -1
{vggsfm → vggsfm_code}/.gitignore +0 -0
{vggsfm → vggsfm_code}/CHANGELOG.txt +0 -0
{vggsfm → vggsfm_code}/CODE_OF_CONDUCT.md +0 -0
{vggsfm → vggsfm_code}/CONTRIBUTING.md +0 -0
{vggsfm → vggsfm_code}/LICENSE.txt +0 -0
{vggsfm → vggsfm_code}/README.md +0 -0
{vggsfm → vggsfm_code}/assets/ui.png +0 -0
{vggsfm → vggsfm_code}/cfgs/demo.yaml +0 -0
{vggsfm → vggsfm_code}/demo.py +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000007.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000012.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000017.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000019.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000024.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000025.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000043.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000052.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000070.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000077.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000085.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000096.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000128.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000145.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000160.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000162.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000168.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000172.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000191.jpg +0 -0
{vggsfm → vggsfm_code}/examples/apple/images/frame000200.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/29057984_287139632.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/32630292_7166579210.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/45839934_4117745134.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/51004432_567773767.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/62620282_3728576515.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/71931631_7212707886.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/78600497_407639599.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/80340357_5029510336.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/81272348_2712949069.jpg +0 -0
{vggsfm → vggsfm_code}/examples/british_museum/images/93266801_2335569192.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000020.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000069.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000096.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000112.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000146.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000149.jpg +0 -0
{vggsfm → vggsfm_code}/examples/cake/images/frame000166.jpg +0 -0

app.py CHANGED Viewed

@@ -4,68 +4,178 @@ import torch
 import numpy as np
 import gradio as gr
-def parse_video(video_file):
-    vs = cv2.VideoCapture(video_file)
-    frames = []
-    while True:
-        (gotit, frame) = vs.read()
-        if frame is not None:
-            frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-            frames.append(frame)
-        if not gotit:
-            break
-    return np.stack(frames)
 @spaces.GPU
-def cotracker_demo(
     input_video,
-    grid_size: int = 10,
-    tracks_leave_trace: bool = False,
 ):
-    load_video = parse_video(input_video)
-    load_video = torch.from_numpy(load_video).permute(0, 3, 1, 2)[None].float()
-    import time
-    def current_milli_time():
-        return round(time.time() * 1000)
-    filename = str(current_milli_time())
-    return os.path.join(
-        os.path.dirname(__file__), "results", f"{filename}.mp4"
-    )
-app = gr.Interface(
-    title="🎨 CoTracker: It is Better to Track Together",
-    description="<div style='text-align: left;'> \
-    <p>Welcome to <a href='http://co-tracker.github.io' target='_blank'>CoTracker</a>! This space demonstrates point (pixel) tracking in videos. \
-    Points are sampled on a regular grid and are tracked jointly. </p> \
-    <p> To get started, simply upload your <b>.mp4</b> video in landscape orientation or click on one of the example videos to load them. The shorter the video, the faster the processing. We recommend submitting short videos of length <b>2-7 seconds</b>.</p> \
-    <ul style='display: inline-block; text-align: left;'> \
-        <li>The total number of grid points is the square of <b>Grid Size</b>.</li> \
-        <li>Check <b>Visualize Track Traces</b> to visualize traces of all the tracked points. </li> \
-    </ul> \
-    <p style='text-align: left'>For more details, check out our <a href='https://github.com/facebookresearch/co-tracker' target='_blank'>GitHub Repo</a> ⭐</p> \
-    </div>",
-    fn=cotracker_demo,
-    inputs=[
-        gr.Video(type="file", label="Input video", interactive=True),
-        gr.Slider(minimum=10, maximum=80, step=1, value=10, label="Number of tracks"),
-    ],
-    outputs=gr.Video(label="Video with predicted tracks"),
-    cache_examples=True,
-    allow_flagging=False,
-)
-app.queue(max_size=20, concurrency_count=1).launch(debug=True)

 import numpy as np
 import gradio as gr
+import trimesh
+import sys
+import os
+sys.path.append('vggsfm_code/')
+import shutil
+from vggsfm_code.hf_demo import demo_fn
+from omegaconf import DictConfig, OmegaConf
+from viz_utils.viz_fn import add_camera
+#
+from scipy.spatial.transform import Rotation
+import PIL
+import spaces
 @spaces.GPU
+def vggsfm_demo(
+    input_image,
     input_video,
+    query_frame_num,
+    max_query_pts
 ):
+    """Run VGGSfM on uploaded images or a video and export the scene as a GLB file.
+
+    Args:
+        input_image: List of uploaded image files, or None. Takes priority over
+            ``input_video``. At least three are required; after sorting, only
+            the first 20 are used.
+        input_video: Path of an uploaded video, or None. One frame is kept
+            every ``int(fps)`` frames (about one per second), up to 20 frames.
+        query_frame_num: Value written to ``cfg.query_frame_num``.
+        max_query_pts: Value written to ``cfg.max_query_pts``.
+
+    Returns:
+        A ``(glb_path, message)`` tuple. ``glb_path`` is None when the input is
+        rejected, in which case ``message`` explains why.
+    """
+    cfg = OmegaConf.load("vggsfm_code/cfgs/demo.yaml")
+    max_input_image = 20
+
+    # Start every run from an empty scene directory so files left over from a
+    # previous request are not picked up by this reconstruction.
+    target_dir = "input_images"
+    if os.path.exists(target_dir):
+        shutil.rmtree(target_dir)
+    target_dir_images = target_dir + "/images"
+    os.makedirs(target_dir_images)
+
+    if input_image is not None:
+        if len(input_image) < 3:
+            return None, "Please input at least three frames"
+        input_image = sorted(input_image)[:max_input_image]
+        # Copy files to the new directory
+        for file_name in input_image:
+            shutil.copy(file_name, target_dir_images)
+    elif input_video is not None:
+        vs = cv2.VideoCapture(input_video)
+        try:
+            fps = vs.get(cv2.CAP_PROP_FPS)
+            frame_rate = 1
+            # The reported FPS can be 0 (or below 1); clamp the sampling
+            # interval to 1 so the modulo below can never divide by zero.
+            frame_interval = max(int(fps * frame_rate), 1) if fps > 0 else 1
+
+            video_frame_num = 0
+            count = 0
+            # Strict "<" keeps the number of extracted frames at max_input_image.
+            while video_frame_num < max_input_image:
+                gotit, frame = vs.read()
+                # Stop before touching the frame: it is not valid after a failed read.
+                if not gotit:
+                    break
+                count += 1
+                if count % frame_interval == 0:
+                    cv2.imwrite(target_dir_images + "/" + f"{video_frame_num:06}.png", frame)
+                    video_frame_num += 1
+        finally:
+            # Always free the capture handle, even if decoding or writing fails.
+            vs.release()
+
+        if video_frame_num < 3:
+            return None, "Please input at least three frames"
+    else:
+        return None, "Input format incorrect"
+
+    cfg.query_frame_num = query_frame_num
+    cfg.max_query_pts = max_query_pts
+    print(f"Files have been copied to {target_dir_images}")
+    cfg.SCENE_DIR = target_dir
+
+    predictions = demo_fn(cfg)
+    glbfile = vggsfm_predictions_to_glb(predictions)
+
+    print(input_image)
+    print(input_video)
+    return glbfile, "Success"
+def vggsfm_predictions_to_glb(predictions):
+    """Convert VGGSfM predictions into a GLB scene and return the file path.
+
+    The scene holds the coloured 3D point cloud plus one camera marker per
+    frame, re-expressed relative to the first camera. It is written to
+    ``glbscene.glb`` in the current working directory.
+
+    Args:
+        predictions: Mapping that provides ``"points3D"``, ``"points3D_rgb"``
+            and ``"extrinsics_opencv"`` as tensors. The extrinsics are copied
+            into the top three rows of a 4x4 matrix per frame, i.e. one
+            ``(3, 4)`` matrix per frame. Colours are scaled by 255, so they are
+            presumably in ``[0, 1]`` -- TODO confirm against ``demo_fn``.
+            Other keys (``"images"``, ``"intrinsics_opencv"``,
+            ``"raw_image_paths"``) are not needed and are no longer read.
+
+    Returns:
+        The path of the exported GLB file (``"glbscene.glb"``).
+    """
+    # learned from https://github.com/naver/dust3r/blob/main/dust3r/viz.py
+    points3D = predictions["points3D"].cpu().numpy()
+    points3D_rgb = (predictions["points3D_rgb"].cpu().numpy() * 255).astype(np.uint8)
+    extrinsics_opencv = predictions["extrinsics_opencv"].cpu().numpy()
+
+    glbscene = trimesh.Scene()
+    glbscene.add_geometry(trimesh.PointCloud(points3D, colors=points3D_rgb))
+
+    camera_edge_colors = [(255, 0, 0), (0, 0, 255), (0, 255, 0), (255, 0, 255), (255, 204, 0), (0, 204, 204),
+                (128, 255, 255), (255, 128, 255), (255, 255, 128), (0, 0, 0), (128, 128, 128)]
+
+    # Pad each 3x4 extrinsic to a 4x4 homogeneous matrix so it can be inverted.
+    frame_num = len(extrinsics_opencv)
+    extrinsics_opencv_4x4 = np.zeros((frame_num, 4, 4))
+    extrinsics_opencv_4x4[:, :3, :4] = extrinsics_opencv
+    extrinsics_opencv_4x4[:, 3, 3] = 1
+
+    for idx in range(frame_num):
+        cam_to_world = np.linalg.inv(extrinsics_opencv_4x4[idx])
+        # Cycle through the palette when there are more cameras than colours.
+        cur_cam_color = camera_edge_colors[idx % len(camera_edge_colors)]
+        add_camera(glbscene, cam_to_world, cur_cam_color, image=None, imsize=(1024,1024),
+                   focal=None,screen_width=0.35)
+
+    # Flip the Y and Z axes (OpenCV -> OpenGL camera convention, as in the
+    # dust3r viewer this is adapted from), turn 180 degrees about Y, and express
+    # everything relative to the first camera.
+    opengl_mat = np.array([[1, 0, 0, 0],
+                    [0, -1, 0, 0],
+                    [0, 0, -1, 0],
+                    [0, 0, 0, 1]])
+    rot = np.eye(4)
+    rot[:3, :3] = Rotation.from_euler('y', np.deg2rad(180)).as_matrix()
+    glbscene.apply_transform(np.linalg.inv(np.linalg.inv(extrinsics_opencv_4x4[0]) @ opengl_mat @ rot))
+
+    glbfile = "glbscene.glb"
+    glbscene.export(file_obj=glbfile)
+    return glbfile
+# Set to False to skip the web UI and run one reconstruction on the bundled
+# "cake" example instead (useful for local debugging).
+LAUNCH_UI = True
+if LAUNCH_UI:
+    demo = gr.Interface(
+        title="🎨 VGGSfM: Visual Geometry Grounded Deep Structure From Motion",
+        description="<div style='text-align: left;'> \
+        <p>Welcome to <a href='https://github.com/facebookresearch/vggsfm' target='_blank'>VGGSfM</a>!</p></div>",
+        fn=vggsfm_demo,
+        # Input order must match the positional parameters of vggsfm_demo.
+        inputs=[
+            gr.File(file_count="multiple", label="Input Images", interactive=True),
+            gr.Video(label="Input video", interactive=True),
+            gr.Slider(minimum=1, maximum=10, step=1, value=5, label="Number of query images"),
+            gr.Slider(minimum=512, maximum=4096, step=1, value=1024, label="Number of query points"),
+        ],
+        outputs=[gr.Model3D(label="Reconstruction"), gr.Textbox(label="Log")],
+        cache_examples=True,
+        allow_flagging=False,
+    )
+    demo.queue(max_size=20, concurrency_count=1).launch(debug=True)
+    # For a temporary public link while debugging locally, use instead:
+    # demo.launch(debug=True, share=True)
+else:
+    import glob
+    files = glob.glob('vggsfm_code/examples/cake/images/*')
+    # vggsfm_demo takes four arguments; use the same defaults as the UI sliders
+    # (5 query images, 1024 query points).
+    vggsfm_demo(files, None, 5, 1024)

debug_demo.py ADDED Viewed

	@@ -0,0 +1,31 @@

+# Scratch script for debugging the Space: first a minimal Gradio "hello" app,
+# then a direct VGGSfM run on the bundled "cake" example under pdb.
+import gradio as gr
+# Return "Hello, <name>" followed by int(intensity) exclamation marks.
+def greet(name, intensity):
+    return "Hello, " + name + "!" * int(intensity)
+demo = gr.Interface(
+    fn=greet,
+    inputs=["text", "slider"],
+    outputs=["text"],
+)
+# NOTE(review): launch() presumably blocks when run as a plain script, so the
+# VGGSfM part below would only run once the server is stopped -- confirm.
+demo.launch(share=True)
+import sys
+import os
+# Make the vendored vggsfm_code/ directory importable before importing from it.
+sys.path.append('vggsfm_code/')
+from vggsfm_code.hf_demo import demo_fn
+from omegaconf import DictConfig, OmegaConf
+cfg_file = "vggsfm_code/cfgs/demo.yaml"
+cfg = OmegaConf.load(cfg_file)
+# Point the pipeline at the bundled example scene.
+cfg.SCENE_DIR = "vggsfm_code/examples/cake"
+# Drop into the debugger just before running the reconstruction.
+import pdb;pdb.set_trace()
+demo_fn(cfg)

glbscene.glb ADDED Viewed

Binary file (97.8 kB). View file

requirements.txt CHANGED Viewed

@@ -7,4 +7,4 @@ git+https://github.com/cvg/LightGlue.git#egg=LightGlue
 numpy==1.26.3
 pycolmap==0.6.1
 https://huggingface.co/facebook/VGGSfM/resolve/main/poselib-2.0.2-cp310-cp310-linux_x86_64.whl

 numpy==1.26.3
 pycolmap==0.6.1
 https://huggingface.co/facebook/VGGSfM/resolve/main/poselib-2.0.2-cp310-cp310-linux_x86_64.whl
+trimesh

{vggsfm → vggsfm_code}/.gitignore RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/CHANGELOG.txt RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/CODE_OF_CONDUCT.md RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/CONTRIBUTING.md RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/LICENSE.txt RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/README.md RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/assets/ui.png RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/cfgs/demo.yaml RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/demo.py RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000007.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000012.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000017.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000019.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000024.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000025.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000043.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000052.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000070.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000077.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000085.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000096.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000128.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000145.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000160.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000162.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000168.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000172.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000191.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/apple/images/frame000200.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/29057984_287139632.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/32630292_7166579210.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/45839934_4117745134.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/51004432_567773767.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/62620282_3728576515.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/71931631_7212707886.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/78600497_407639599.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/80340357_5029510336.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/81272348_2712949069.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/british_museum/images/93266801_2335569192.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000020.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000069.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000096.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000112.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000146.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000149.jpg RENAMED Viewed

File without changes

{vggsfm → vggsfm_code}/examples/cake/images/frame000166.jpg RENAMED Viewed

File without changes