oxkitsune committed on
Commit
7b059da
1 Parent(s): a0e3696

webm webcam output?

Files changed (4)
  1. app.py +5 -10
  2. pyproject.toml +2 -2
  3. requirements.txt +1 -1
  4. uv.lock +0 -0
app.py CHANGED
@@ -76,6 +76,7 @@ def predict_depth(input_image):
 @rr.thread_local_stream("rerun_example_ml_depth_pro")
 def run_rerun(path_to_video):
     stream = rr.binary_stream()
+    print("video path:", path_to_video)
 
     blueprint = rrb.Blueprint(
         rrb.Vertical(
@@ -93,15 +94,16 @@ def run_rerun(path_to_video):
     rr.send_blueprint(blueprint)
 
     yield stream.read()
+
     video_asset = rr.AssetVideo(path=path_to_video)
     rr.log("world/video", video_asset, static=True)
 
     # Send automatically determined video frame timestamps.
     frame_timestamps_ns = video_asset.read_frame_timestamps_ns()
 
-    # load the video using opencv
     cap = cv2.VideoCapture(path_to_video)
-    # loop through the video and log the frames using the video timestamps
+    num_frames = cap.get(cv2.CAP_PROP_FRAME_COUNT)
+    print(f"Number of frames in the video: {num_frames}")
     for i in range(len(frame_timestamps_ns)):
         ret, frame = cap.read()
         if not ret:
@@ -161,19 +163,12 @@ def run_rerun(path_to_video):
         yield stream.read()
 
 
-# Example images
-example_images = [
-    "examples/lemur.jpg",
-    "examples/cat.jpg",
-    "examples/silly-cat.png",
-]
-
 with gr.Blocks() as interface:
     gr.Markdown(
         """
         # DepthPro Rerun Demo
 
-        [DepthPro](https://huggingface.co/apple/DepthPro) is a fast metric depth prediction model. Simply upload an image to predict its inverse depth map and focal length.
+        [DepthPro](https://huggingface.co/apple/DepthPro) is a fast metric depth prediction model. Simply upload a video to visualize the depth predictions in real-time.
 
         High resolution videos will be automatically resized to 256x256 pixels, to speed up the inference and visualize multiple frames.
         """
pyproject.toml CHANGED
@@ -3,14 +3,14 @@ name = "rerun-apple-depth-pro"
 version = "0.1.0"
 description = "Add your description here"
 readme = "README.md"
-requires-python = ">=3.10"
+requires-python = ">=3.8"
 dependencies = [
     "attrs>=24.2.0",
     "depth-pro",
     "gradio>=4.44.1",
     "gradio-rerun>=0.0.8",
     "rerun-sdk==0.19.0",
-    "spaces>=0.30.3",
+    "spaces>=0.30.4",
 ]
 
 [tool.uv]
requirements.txt CHANGED
@@ -80,7 +80,7 @@ semantic-version==2.10.0
 shellingham==1.5.4
 six==1.16.0
 sniffio==1.3.1
-spaces==0.30.3
+spaces==0.30.4
 stack-data==0.6.3
 starlette==0.38.6
 sympy==1.13.3
uv.lock CHANGED
The diff for this file is too large to render. See raw diff