spiritupbro and AP123 committed
Commit 79527d4 · 0 parents

Duplicate from AP123/text-to-3D


Co-authored-by: AP <[email protected]>

Files changed (7):
  1. .gitattributes +34 -0
  2. README.md +13 -0
  3. app.py +264 -0
  4. images/chair.png +0 -0
  5. images/corgi.png +0 -0
  6. images/cube_stack.jpg +0 -0
  7. requirements.txt +5 -0
.gitattributes ADDED
@@ -0,0 +1,34 @@
+ *.7z filter=lfs diff=lfs merge=lfs -text
+ *.arrow filter=lfs diff=lfs merge=lfs -text
+ *.bin filter=lfs diff=lfs merge=lfs -text
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
+ *.ftz filter=lfs diff=lfs merge=lfs -text
+ *.gz filter=lfs diff=lfs merge=lfs -text
+ *.h5 filter=lfs diff=lfs merge=lfs -text
+ *.joblib filter=lfs diff=lfs merge=lfs -text
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
+ *.model filter=lfs diff=lfs merge=lfs -text
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
+ *.npy filter=lfs diff=lfs merge=lfs -text
+ *.npz filter=lfs diff=lfs merge=lfs -text
+ *.onnx filter=lfs diff=lfs merge=lfs -text
+ *.ot filter=lfs diff=lfs merge=lfs -text
+ *.parquet filter=lfs diff=lfs merge=lfs -text
+ *.pb filter=lfs diff=lfs merge=lfs -text
+ *.pickle filter=lfs diff=lfs merge=lfs -text
+ *.pkl filter=lfs diff=lfs merge=lfs -text
+ *.pt filter=lfs diff=lfs merge=lfs -text
+ *.pth filter=lfs diff=lfs merge=lfs -text
+ *.rar filter=lfs diff=lfs merge=lfs -text
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
+ *.tflite filter=lfs diff=lfs merge=lfs -text
+ *.tgz filter=lfs diff=lfs merge=lfs -text
+ *.wasm filter=lfs diff=lfs merge=lfs -text
+ *.xz filter=lfs diff=lfs merge=lfs -text
+ *.zip filter=lfs diff=lfs merge=lfs -text
+ *.zst filter=lfs diff=lfs merge=lfs -text
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,13 @@
+ ---
+ title: Point-e Demo
+ emoji: 🐢
+ colorFrom: yellow
+ colorTo: blue
+ sdk: gradio
+ sdk_version: 3.14.0
+ app_file: app.py
+ pinned: false
+ duplicated_from: AP123/text-to-3D
+ ---
+
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
app.py ADDED
@@ -0,0 +1,264 @@
+ import os
+ from PIL import Image
+ import torch
+
+ from point_e.diffusion.configs import DIFFUSION_CONFIGS, diffusion_from_config
+ from point_e.diffusion.sampler import PointCloudSampler
+ from point_e.models.download import load_checkpoint
+ from point_e.models.configs import MODEL_CONFIGS, model_from_config
+ from point_e.util.plotting import plot_point_cloud
+ from point_e.util.pc_to_mesh import marching_cubes_mesh
+
+ import skimage.measure
+
+ from pyntcloud import PyntCloud
+ import matplotlib.colors
+ import plotly.graph_objs as go
+
+ import trimesh
+
+ import gradio as gr
+
+
+ state = ""
+ device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+
+ def set_state(s):
+     print(s)
+     global state
+     state = s
+
+ def get_state():
+     return state
+
+ set_state('Creating txt2mesh model...')
+ t2m_name = 'base40M-textvec'
+ t2m_model = model_from_config(MODEL_CONFIGS[t2m_name], device)
+ t2m_model.eval()
+ base_diffusion_t2m = diffusion_from_config(DIFFUSION_CONFIGS[t2m_name])
+
+ set_state('Downloading txt2mesh checkpoint...')
+ t2m_model.load_state_dict(load_checkpoint(t2m_name, device))
+
+
+ def load_img2mesh_model(model_name):
+     set_state(f'Creating img2mesh model {model_name}...')
+     i2m_name = model_name
+     i2m_model = model_from_config(MODEL_CONFIGS[i2m_name], device)
+     i2m_model.eval()
+     base_diffusion_i2m = diffusion_from_config(DIFFUSION_CONFIGS[i2m_name])
+
+     set_state(f'Downloading img2mesh checkpoint {model_name}...')
+     i2m_model.load_state_dict(load_checkpoint(i2m_name, device))
+
+     return i2m_model, base_diffusion_i2m
+
+ img2mesh_model_name = 'base40M' #'base300M' #'base1B'
+ i2m_model, base_diffusion_i2m = load_img2mesh_model(img2mesh_model_name)
+
+
+ set_state('Creating upsample model...')
+ upsampler_model = model_from_config(MODEL_CONFIGS['upsample'], device)
+ upsampler_model.eval()
+ upsampler_diffusion = diffusion_from_config(DIFFUSION_CONFIGS['upsample'])
+
+ set_state('Downloading upsampler checkpoint...')
+ upsampler_model.load_state_dict(load_checkpoint('upsample', device))
+
+ set_state('Creating SDF model...')
+ sdf_name = 'sdf'
+ sdf_model = model_from_config(MODEL_CONFIGS[sdf_name], device)
+ sdf_model.eval()
+
+ set_state('Loading SDF model...')
+ sdf_model.load_state_dict(load_checkpoint(sdf_name, device))
+
+ stable_diffusion = gr.Blocks.load(name="spaces/runwayml/stable-diffusion-v1-5")
+
+
+ set_state('')
+
+ def get_sampler(model_name, txt2obj, guidance_scale):
+
+     global img2mesh_model_name
+     global base_diffusion_i2m
+     global i2m_model
+     if model_name != img2mesh_model_name:
+         img2mesh_model_name = model_name
+         i2m_model, base_diffusion_i2m = load_img2mesh_model(model_name)
+
+     return PointCloudSampler(
+         device=device,
+         models=[t2m_model if txt2obj else i2m_model, upsampler_model],
+         diffusions=[base_diffusion_t2m if txt2obj else base_diffusion_i2m, upsampler_diffusion],
+         num_points=[1024, 4096 - 1024],
+         aux_channels=['R', 'G', 'B'],
+         guidance_scale=[guidance_scale, 0.0 if txt2obj else guidance_scale],
+         model_kwargs_key_filter=('texts', '') if txt2obj else ("*",)
+     )
+
+ def generate_txt2img(prompt):
+
+     prompt = f"a 3d rendering of {prompt}, full view, white background"
+     gallery_dir = stable_diffusion(prompt, fn_index=2)
+     imgs = [os.path.join(gallery_dir, img) for img in os.listdir(gallery_dir) if os.path.splitext(img)[1] == '.jpg']
+
+     return imgs[0], gr.update(visible=True)
+
+ def generate_3D(input, model_name='base40M', guidance_scale=3.0, grid_size=32):
+
+     set_state('Entered generate function...')
+
+     if isinstance(input, Image.Image):
+         input = prepare_img(input)
+
+     # if input is a string, it's a text prompt
+     sampler = get_sampler(model_name, txt2obj=isinstance(input, str), guidance_scale=guidance_scale)
+
+     # Produce a sample from the model.
+     set_state('Sampling...')
+     samples = None
+     kw_args = dict(texts=[input]) if isinstance(input, str) else dict(images=[input])
+     for x in sampler.sample_batch_progressive(batch_size=1, model_kwargs=kw_args):
+         samples = x
+
+     set_state('Converting to point cloud...')
+     pc = sampler.output_to_point_clouds(samples)[0]
+
+     set_state('Saving point cloud...')
+     with open("point_cloud.ply", "wb") as f:
+         pc.write_ply(f)
+
+     set_state('Converting to mesh...')
+     save_ply(pc, 'mesh.ply', grid_size)
+
+     set_state('')
+
+     return pc_to_plot(pc), ply_to_obj('mesh.ply', '3d_model.obj'), gr.update(value=['3d_model.obj', 'mesh.ply', 'point_cloud.ply'], visible=True)
+
+ def prepare_img(img):
+
+     w, h = img.size
+     if w > h:
+         img = img.crop(((w - h) / 2, 0, w - (w - h) / 2, h))  # crop takes one (left, upper, right, lower) box tuple
+     else:
+         img = img.crop((0, (h - w) / 2, w, h - (h - w) / 2))
+
+     # resize to 256x256
+     img = img.resize((256, 256))
+
+     return img
+
+ def pc_to_plot(pc):
+
+     return go.Figure(
+         data=[
+             go.Scatter3d(
+                 x=pc.coords[:,0], y=pc.coords[:,1], z=pc.coords[:,2],
+                 mode='markers',
+                 marker=dict(
+                     size=2,
+                     color=['rgb({},{},{})'.format(r,g,b) for r,g,b in zip(pc.channels["R"], pc.channels["G"], pc.channels["B"])],
+                 )
+             )
+         ],
+         layout=dict(
+             scene=dict(xaxis=dict(visible=False), yaxis=dict(visible=False), zaxis=dict(visible=False))
+         ),
+     )
+
+ def ply_to_obj(ply_file, obj_file):
+     mesh = trimesh.load(ply_file)
+     mesh.export(obj_file)
+
+     return obj_file
+
+ def save_ply(pc, file_name, grid_size):
+
+     # Produce a mesh (with vertex colors)
+     mesh = marching_cubes_mesh(
+         pc=pc,
+         model=sdf_model,
+         batch_size=4096,
+         grid_size=grid_size, # increase to 128 for resolution used in evals
+         progress=True,
+     )
+
+     # Write the mesh to a PLY file to import into some other program.
+     with open(file_name, 'wb') as f:
+         mesh.write_ply(f)
+
+
+ with gr.Blocks() as app:
+     gr.Markdown("# Image-to-3D")
+     gr.Markdown("Turn any image or prompt into a 3D asset! Powered by Stable Diffusion and OpenAI Point-E. Check out https://twitter.com/angrypenguinPNG for a tutorial on how to best use this space.")
+     gr.HTML("""To skip the queue you can duplicate this space:
+             <br><a href="https://huggingface.co/spaces/AP123/text-to-3D?duplicate=true"><img src="https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14" alt="Duplicate Space"></a>
+             <br>Don't forget to change space hardware to <b>GPU</b> after duplicating it.""")
+
+     with gr.Row():
+         with gr.Column():
+             with gr.Tab("Image to 3D"):
+                 img = gr.Image(label="Image")
+                 gr.Markdown("Best results with images of 3D objects with no shadows on a white background.")
+                 btn_generate_img2obj = gr.Button(value="Generate")
+
+             with gr.Tab("Text to 3D"):
+                 gr.Markdown("Generate an image with Stable Diffusion, then convert it to 3D. Just enter the object you want to generate.")
+                 prompt_sd = gr.Textbox(label="Prompt", placeholder="a 3d rendering of [your prompt], full view, white background")
+                 btn_generate_txt2sd = gr.Button(value="Generate image")
+                 img_sd = gr.Image(label="Image")
+                 btn_generate_sd2obj = gr.Button(value="Convert to 3D", visible=False)
+
+             with gr.Accordion("Advanced settings", open=False):
+                 dropdown_models = gr.Dropdown(label="Model", value="base40M", choices=["base40M", "base300M"]) #, "base1B"])
+                 guidance_scale = gr.Slider(label="Guidance scale", value=3.0, minimum=3.0, maximum=10.0, step=0.1)
+                 grid_size = gr.Slider(label="Grid size (for .obj 3D model)", value=32, minimum=16, maximum=128, step=16)
+
+         with gr.Column():
+             plot = gr.Plot(label="Point cloud")
+             # btn_pc_to_obj = gr.Button(value="Convert to OBJ", visible=False)
+             model_3d = gr.Model3D(value=None)
+             file_out = gr.File(label="Files", visible=False)
+
+     # state_info = gr.Textbox(label="State", show_label=False).style(container=False)
+
+
+     # inputs = [dropdown_models, prompt, img, guidance_scale, grid_size]
+     outputs = [plot, model_3d, file_out]
+
+     btn_generate_img2obj.click(generate_3D, inputs=[img, dropdown_models, guidance_scale, grid_size], outputs=outputs)
+
+     prompt_sd.submit(generate_txt2img, inputs=prompt_sd, outputs=[img_sd, btn_generate_sd2obj])
+     btn_generate_txt2sd.click(generate_txt2img, inputs=prompt_sd, outputs=[img_sd, btn_generate_sd2obj], queue=False)
+     btn_generate_sd2obj.click(generate_3D, inputs=[img_sd, dropdown_models, guidance_scale, grid_size], outputs=outputs)  # convert the generated image, not the upload-tab one
+
+     # btn_pc_to_obj.click(ply_to_obj, inputs=plot, outputs=[model_3d, file_out])
+
+     gr.Examples(
+         examples=[
+             ["images/corgi.png"],
+             ["images/cube_stack.jpg"],
+             ["images/chair.png"],
+         ],
+         inputs=[img],
+         outputs=outputs,
+         fn=generate_3D,
+         cache_examples=False
+     )
+
+     # app.load(get_state, inputs=[], outputs=state_info, every=0.5, show_progress=False)
+
+     gr.HTML("""
+         <br><br>
+         <div style="border-top: 1px solid #303030;">
+             <br>
+             <p>Space by:<br>
+             <a href="https://twitter.com/hahahahohohe"><img src="https://img.shields.io/twitter/follow/hahahahohohe?label=%40anzorq&style=social" alt="Twitter Follow"></a><br>
+             <a href="https://github.com/qunash"><img src="https://img.shields.io/github/followers/qunash?style=social" alt="GitHub followers"></a></p><br>
+             <a href="https://www.buymeacoffee.com/anzorq" target="_blank"><img src="https://cdn.buymeacoffee.com/buttons/v2/default-yellow.png" alt="Buy Me A Coffee" style="height: 30px !important;width: 102px !important;" ></a><br><br>
+             <p><img src="https://visitor-badge.glitch.me/badge?page_id=anzorq.point-e_demo" alt="visitors"></p>
+         </div>
+     """)
+
+ app.queue(max_size=250, concurrency_count=6).launch()
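
Note: stripped of the Gradio UI, the text-to-3D path in app.py reduces to a short Point-E loop. Below is a minimal sketch using only the point_e calls that appear in the file above; the prompt string and variable names are illustrative, and checkpoints download on first use just as in the app.

import torch
from point_e.diffusion.configs import DIFFUSION_CONFIGS, diffusion_from_config
from point_e.diffusion.sampler import PointCloudSampler
from point_e.models.configs import MODEL_CONFIGS, model_from_config
from point_e.models.download import load_checkpoint

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Text-conditioned base model (first 1024 points) plus the upsampler (to 4096 points).
base_model = model_from_config(MODEL_CONFIGS['base40M-textvec'], device).eval()
base_model.load_state_dict(load_checkpoint('base40M-textvec', device))
upsampler = model_from_config(MODEL_CONFIGS['upsample'], device).eval()
upsampler.load_state_dict(load_checkpoint('upsample', device))

sampler = PointCloudSampler(
    device=device,
    models=[base_model, upsampler],
    diffusions=[diffusion_from_config(DIFFUSION_CONFIGS['base40M-textvec']),
                diffusion_from_config(DIFFUSION_CONFIGS['upsample'])],
    num_points=[1024, 4096 - 1024],
    aux_channels=['R', 'G', 'B'],
    guidance_scale=[3.0, 0.0],              # UI default; no guidance on the upsampler for text prompts
    model_kwargs_key_filter=('texts', ''),  # only the base model sees the prompt
)

# The sampler yields intermediate batches; the last one is the finished sample.
samples = None
for x in sampler.sample_batch_progressive(batch_size=1, model_kwargs=dict(texts=['a red chair'])):
    samples = x

pc = sampler.output_to_point_clouds(samples)[0]
with open('point_cloud.ply', 'wb') as f:
    pc.write_ply(f)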
images/chair.png ADDED
images/corgi.png ADDED
images/cube_stack.jpg ADDED
requirements.txt ADDED
@@ -0,0 +1,5 @@
+ git+https://github.com/openai/point-e@main
+ pyntcloud
+ plotly
+ trimesh
+
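
For completeness, a sketch of the point-cloud-to-mesh step that save_ply() and ply_to_obj() perform in app.py, under the same assumptions as the sketch above (it continues from it: `pc` is the point cloud sampled there, and grid_size=32 matches the UI default, with 128 used for eval-quality meshes).

import torch
import trimesh
from point_e.models.configs import MODEL_CONFIGS, model_from_config
from point_e.models.download import load_checkpoint
from point_e.util.pc_to_mesh import marching_cubes_mesh

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# SDF model that turns the point cloud into an implicit surface for marching cubes.
sdf_model = model_from_config(MODEL_CONFIGS['sdf'], device).eval()
sdf_model.load_state_dict(load_checkpoint('sdf', device))

mesh = marching_cubes_mesh(
    pc=pc,          # point cloud from the previous sketch
    model=sdf_model,
    batch_size=4096,
    grid_size=32,   # the app exposes 16-128; higher is slower but finer
    progress=True,
)
with open('mesh.ply', 'wb') as f:
    mesh.write_ply(f)

# PLY -> OBJ via trimesh, as ply_to_obj() does for the gr.Model3D viewer.
trimesh.load('mesh.ply').export('3d_model.obj')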