jev-aleks committed on
Commit
d1494df
·
1 Parent(s): e55f275

add description

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. app.py +14 -1
  3. demo_utils/examples/log.csv +1 -1
README.md CHANGED
@@ -9,7 +9,7 @@ sdk_version: 5.35.0
9
  app_file: app.py
10
  pinned: false
11
  license: apache-2.0
12
- short_description: SceneDINO Demo
13
  ---
14
 
15
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
9
  app_file: app.py
10
  pinned: false
11
  license: apache-2.0
12
+ short_description: SceneDINO (ICCV 2025)
13
  ---
14
 
15
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
app.py CHANGED
@@ -190,6 +190,18 @@ def demo_run(image: str,
190
  return output_2d, glb_path
191
 
192
 
 
 
 
 
 
 
 
 
 
 
 
 
193
  demo = gr.Interface(
194
  demo_run,
195
  inputs=[
@@ -197,7 +209,7 @@ demo = gr.Interface(
197
  gr.Radio(label="Backbone", choices=["DINO (ViT-B)", "DINOv2 (ViT-B)"]),
198
  gr.Radio(label="Mode", choices=["Feature PCA 1-3", "Feature PCA 4-6", "Feature PCA 7-9", "SSC (unsup.)", "SSC (linear)"]),
199
  gr.Slider(label="Density threshold", minimum=0, maximum=1, step=0.05, value=0.2),
200
- gr.Slider(label="Resolution [m]", minimum=0.05, maximum=0.5, step=0.1, value=0.2),
201
  gr.Slider(label="X Range [m]", minimum=1, maximum=50, step=1, value=10),
202
  gr.Slider(label="Y Range [m]", minimum=1, maximum=50, step=1, value=10),
203
  gr.Slider(label="Z Range [m]", minimum=1, maximum=100, step=1, value=20),
@@ -212,6 +224,7 @@ demo = gr.Interface(
212
  ],
213
  title="SceneDINO Demo",
214
  examples="demo_utils/examples",
 
215
  )
216
 
217
  demo.launch()
 
190
  return output_2d, glb_path
191
 
192
 
193
+ markdown_description = """
194
+ [Paper](https://arxiv.org/abs/xxxx.xxxxx) | [Code](https://github.com/tum-vision/scenedino) | [Project Page](https://visinf.github.io/scenedino/)
195
+ Upload a single image to infer 3D geometry and semantics with **SceneDINO**. You can find some example images below.
196
+
197
+ - **Feature PCA**
198
+ We visualize our high-dimensional feature field by applying PCA and mapping three of the components to RGB. Interactively adjust which components are shown.
199
+ - **SSC** (Semantic Scene Completion)
200
+ Our features are used downstream for semantic predictions. Choose between the fully unsupervised approach or the linear probing approach.
201
+
202
+ <span style="color:orange">⚠️ NOTE: We assume the intrinsic camera matrix of KITTI-360; images are cropped and rescaled to 192x640. Further note our demo's voxel limit of 5M. </span>
203
+ """
204
+
205
  demo = gr.Interface(
206
  demo_run,
207
  inputs=[
 
209
  gr.Radio(label="Backbone", choices=["DINO (ViT-B)", "DINOv2 (ViT-B)"]),
210
  gr.Radio(label="Mode", choices=["Feature PCA 1-3", "Feature PCA 4-6", "Feature PCA 7-9", "SSC (unsup.)", "SSC (linear)"]),
211
  gr.Slider(label="Density threshold", minimum=0, maximum=1, step=0.05, value=0.2),
212
+ gr.Slider(label="Resolution [m]", minimum=0.05, maximum=0.5, step=0.05, value=0.2),
213
  gr.Slider(label="X Range [m]", minimum=1, maximum=50, step=1, value=10),
214
  gr.Slider(label="Y Range [m]", minimum=1, maximum=50, step=1, value=10),
215
  gr.Slider(label="Z Range [m]", minimum=1, maximum=100, step=1, value=20),
 
224
  ],
225
  title="SceneDINO Demo",
226
  examples="demo_utils/examples",
227
+ description=markdown_description,
228
  )
229
 
230
  demo.launch()
demo_utils/examples/log.csv CHANGED
@@ -1,2 +1,2 @@
1
  image, backbone, mode, sigma_threshold, resolution, x_range, y_range, z_range
2
- "kitti-360.png","DINO (ViT-B)","Feature PCA 1-3",0.25,0.5,20,20,50
 
1
  image, backbone, mode, sigma_threshold, resolution, x_range, y_range, z_range
2
+ "kitti-360.png","DINOv2 (ViT-B)","Feature PCA 1-3",0.25,0.25,20,20,50