Spaces:

sudo-ai
/

MeshFormer

Running

App Files Files Community

NCJ committed on Aug 14, 2024

Commit

57a1960

verified ·

1 Parent(s): 234bf91

copy from dev

Browse files

Files changed (37) hide show

.gitattributes +30 -0
Dockerfile +55 -0
README.md +2 -2
demo_examples/01.png +3 -0
demo_examples/03.png +3 -0
demo_examples/04.png +3 -0
demo_examples/05.png +3 -0
demo_examples/07.png +3 -0
demo_examples/09.png +3 -0
demo_examples/12.png +3 -0
demo_examples/14.png +3 -0
demo_examples/17.jpg +3 -0
demo_examples/18.jpg +3 -0
demo_examples/19.jpg +3 -0
demo_examples/21.png +3 -0
demo_examples/22.png +3 -0
demo_examples/23.png +3 -0
demo_examples/24.png +3 -0
demo_examples/25.png +3 -0
demo_examples/26.png +3 -0
demo_examples/27.png +3 -0
demo_examples/28.png +3 -0
demo_examples/29.png +3 -0
demo_examples/30.png +3 -0
demo_examples/31.png +3 -0
demo_examples/32.png +3 -0
demo_examples/33.png +3 -0
demo_examples/35.png +3 -0
demo_examples/cup.png +3 -0
demo_examples/teapot.png +3 -0
gradio_demo.py +415 -0
gradio_model3dcolor-0.0.1-py3-none-any.whl +0 -0
gradio_model3dnormal-0.0.1-py3-none-any.whl +0 -0
ply2glb.py +57 -0
sam_inference.py +40 -0
style.css +32 -0
utils.py +86 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,33 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+demo_examples/ filter=lfs diff=lfs merge=lfs -text
+demo_examples/*.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/cup.jpg filter=lfs diff=lfs merge=lfs -text
+demo_examples/teapot.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/cup.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/01.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/12.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/17.jpg filter=lfs diff=lfs merge=lfs -text
+demo_examples/25.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/26.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/27.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/29.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/31.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/33.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/35.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/05.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/22.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/23.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/04.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/09.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/18.jpg filter=lfs diff=lfs merge=lfs -text
+demo_examples/19.jpg filter=lfs diff=lfs merge=lfs -text
+demo_examples/24.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/32.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/03.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/07.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/14.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/21.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/28.png filter=lfs diff=lfs merge=lfs -text
+demo_examples/30.png filter=lfs diff=lfs merge=lfs -text

Dockerfile ADDED Viewed

	@@ -0,0 +1,55 @@

+FROM python:3.10-slim
+LABEL version="1.0.2"
+ENV LANG=C.UTF-8 LC_ALL=C.UTF-8
+ENV TZ=America/Los_Angeles
+RUN ln -snf /usr/share/zoneinfo/$TZ /etc/localtime && echo $TZ > /etc/timezone
+# Native packages; the apt package lists are removed in the same layer so
+# they are not kept in the image.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    curl \
+    libx11-6 \
+    libxrender1 \
+    libxxf86vm1 \
+    libxfixes3 \
+    libxi6 \
+    libxkbcommon0 \
+    libgomp1 \
+    libsm6 \
+    libgl1 \
+    git \
+    && rm -rf /var/lib/apt/lists/*
+RUN pip3 install --no-cache-dir \
+    numpy \
+    trimesh \
+    Pillow \
+    gradio==4.40.0 \
+    bpy \
+    opencv-python-headless
+# CPU-only wheels from the PyTorch index.
+RUN pip3 install --no-cache-dir \
+    torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu
+RUN pip3 install --no-cache-dir git+https://github.com/facebookresearch/segment-anything.git
+# Set up a new user named "user" with user ID 1000
+RUN useradd -m -u 1000 user
+# Switch to the "user" user
+USER user
+# Set home to the user's home directory.
+# PYTHONPATH is spelled out literally: within a single ENV instruction,
+# $HOME would expand to its value from before this instruction, not to
+# the /home/user assigned on the first line.
+ENV HOME=/home/user \
+    PATH=/home/user/.local/bin:$PATH \
+    PYTHONPATH=/home/user/app \
+    PYTHONUNBUFFERED=1 \
+    SYSTEM=spaces
+# Set the working directory to the user's home directory
+WORKDIR $HOME/app
+# Copy the current directory contents into the container at $HOME/app setting the owner to the user
+COPY --chown=user . $HOME/app
+RUN pip3 install --no-cache-dir gradio_model3dcolor-0.0.1-py3-none-any.whl
+RUN pip3 install --no-cache-dir gradio_model3dnormal-0.0.1-py3-none-any.whl
+# -f makes curl fail on an HTTP error instead of saving the error page as the
+# checkpoint; -L follows redirects.
+RUN mkdir -p ./checkpoints/ && curl -fL https://dl.fbaipublicfiles.com/segment_anything/sam_vit_h_4b8939.pth -o ./checkpoints/sam_vit_h_4b8939.pth
+CMD ["python3", "gradio_demo.py"]

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
-title: MeshFormer
-emoji: 📈
 colorFrom: pink
 colorTo: gray
 sdk: docker

 ---
+title: MeshFormer Dev
+emoji: 🏢
 colorFrom: pink
 colorTo: gray
 sdk: docker

demo_examples/01.png ADDED Viewed

Git LFS Details

SHA256: 4e17b300fd9700fab365cab312f5c6383265fa96c423fe2920a17cbbce1ca5b2
Pointer size: 130 Bytes
Size of remote file: 73.7 kB

demo_examples/03.png ADDED Viewed

Git LFS Details

SHA256: 85568b0b61217649faa5f49009be26ede5fb25ac7a906fa1a9672ece35cb7ce9
Pointer size: 130 Bytes
Size of remote file: 81.4 kB

demo_examples/04.png ADDED Viewed

Git LFS Details

SHA256: 1a72c4dd1e9cc9a82b4a7a546f919f0f6ec4fc135103ba0e5d2ac33abd822b39
Pointer size: 130 Bytes
Size of remote file: 81.8 kB

demo_examples/05.png ADDED Viewed

Git LFS Details

SHA256: 2e57f6e4e76cc85fadbd6965aeca8e875217c204bf3f68043a6b362a8773450a
Pointer size: 130 Bytes
Size of remote file: 79.3 kB

demo_examples/07.png ADDED Viewed

Git LFS Details

SHA256: 9f383df1d66e40b51eb4dfcccfe69498677552c088d4827a7c64ef6dbca5f07f
Pointer size: 130 Bytes
Size of remote file: 43.6 kB

demo_examples/09.png ADDED Viewed

Git LFS Details

SHA256: 0fc0ce5e5614214458f038e7c822ec188188c32e4596c3bbb170d42331d2174d
Pointer size: 131 Bytes
Size of remote file: 196 kB

demo_examples/12.png ADDED Viewed

Git LFS Details

SHA256: 883cbadd6f01de6d1a4d3e667441b0bfa30fb91f754e5b2bebf42d2cc513d9d3
Pointer size: 130 Bytes
Size of remote file: 51.6 kB

demo_examples/14.png ADDED Viewed

Git LFS Details

SHA256: 65189f337ef48800a8c16589a81c78ba21a1b6c48a6549333e291a4b4ad25c12
Pointer size: 131 Bytes
Size of remote file: 106 kB

demo_examples/17.jpg ADDED Viewed

Git LFS Details

SHA256: 1be16df5ef2104c48b1780cffcb0ad1e3c84f02e7dfb62989c90b942e6119f0e
Pointer size: 130 Bytes
Size of remote file: 57.3 kB

demo_examples/18.jpg ADDED Viewed

Git LFS Details

SHA256: 9e24490a9d7374cca2c403266f4068238a0af26a923b62b8b7ea0669a1697cf5
Pointer size: 130 Bytes
Size of remote file: 58.1 kB

demo_examples/19.jpg ADDED Viewed

Git LFS Details

SHA256: 9a3ba96921dad9ff96676904f7d1514a8fbbea8fbaf147cb219bd92d9766f1ec
Pointer size: 130 Bytes
Size of remote file: 78.2 kB

demo_examples/21.png ADDED Viewed

Git LFS Details

SHA256: ef94c6494d6bd9244a4903c7bf18a3770eea57c66b2a53e5c6a1cbcb99ab11eb
Pointer size: 130 Bytes
Size of remote file: 35 kB

demo_examples/22.png ADDED Viewed

Git LFS Details

SHA256: b1f5488931814df7776ecc9ff676e3f95ea6270fe202572e8d7568344024bec5
Pointer size: 130 Bytes
Size of remote file: 47 kB

demo_examples/23.png ADDED Viewed

Git LFS Details

SHA256: 340592ce713f1b552a1424d4c3a871825b8d7ac4289eb1ed10644cecb9fba1f6
Pointer size: 130 Bytes
Size of remote file: 66.7 kB

demo_examples/24.png ADDED Viewed

Git LFS Details

SHA256: 4ccd19157bc794f27bfe69802c824cfa51999b0a6add3d23bc91cd608e0717f7
Pointer size: 131 Bytes
Size of remote file: 104 kB

demo_examples/25.png ADDED Viewed

Git LFS Details

SHA256: bff2100e7b26caa71e54c9251991ca388e006d978ce22e8ebcbcc301b01a3aac
Pointer size: 130 Bytes
Size of remote file: 51.8 kB

demo_examples/26.png ADDED Viewed

Git LFS Details

SHA256: 5b5031352b0891534bc09094cd04251de3c1767c70b6b622914c64bfcda80b4f
Pointer size: 130 Bytes
Size of remote file: 51 kB

demo_examples/27.png ADDED Viewed

Git LFS Details

SHA256: df923c2c8f20361df123f2afb25254d71d5825b18842a86e40ab5559617cb70a
Pointer size: 130 Bytes
Size of remote file: 77 kB

demo_examples/28.png ADDED Viewed

Git LFS Details

SHA256: 1d2d8af59b2f2b4ca0e6546435181b4869a24b0a8394bba52b51e2f1b5a73dc8
Pointer size: 130 Bytes
Size of remote file: 63 kB

demo_examples/29.png ADDED Viewed

Git LFS Details

SHA256: 1746dbdf3dff3bfd13e201d5ab5ea30f5404057000bc658222cba0fe1d12b946
Pointer size: 130 Bytes
Size of remote file: 49.3 kB

demo_examples/30.png ADDED Viewed

Git LFS Details

SHA256: 4920b94fe72bc494c3404df3c8617ea7b837f29cfddbde73e65d901f1abd80a3
Pointer size: 131 Bytes
Size of remote file: 349 kB

demo_examples/31.png ADDED Viewed

Git LFS Details

SHA256: a2c1cadc847ee50709c175b27fa716ccff645ca3f1844bfc3ddccd213cbefb56
Pointer size: 130 Bytes
Size of remote file: 48.3 kB

demo_examples/32.png ADDED Viewed

Git LFS Details

SHA256: a551e8bcfdc1542c92fae1236fa3428bea3998f7187e772368786cff8297aa29
Pointer size: 130 Bytes
Size of remote file: 75.2 kB

demo_examples/33.png ADDED Viewed

Git LFS Details

SHA256: 4cf620024f77d04115d5cff2793d5ba5de92d7491bc9b041cd4da3f25a597abb
Pointer size: 132 Bytes
Size of remote file: 2.15 MB

demo_examples/35.png ADDED Viewed

Git LFS Details

SHA256: 5b6812a04735cb977ff7ed20ceb265ec0a0046c7273e629830348af4b38df9ec
Pointer size: 132 Bytes
Size of remote file: 1.6 MB

demo_examples/cup.png ADDED Viewed

Git LFS Details

SHA256: be790add8ea7690abba3f464d18f103a459cdb1a0bd4346cf9040edb59e3c151
Pointer size: 131 Bytes
Size of remote file: 567 kB

demo_examples/teapot.png ADDED Viewed

Git LFS Details

SHA256: 46c51d39185186764b0374f3716c18dc67518e26a19fe01fb381c48f60102d60
Pointer size: 131 Bytes
Size of remote file: 349 kB

gradio_demo.py ADDED Viewed

	@@ -0,0 +1,415 @@

+import gradio as gr
+import numpy as np
+import os
+import json
+import subprocess
+from PIL import Image
+from functools import partial
+from datetime import datetime
+from sam_inference import get_sam_predictor, sam_seg
+from utils import blend_seg, blend_seg_pure
+import cv2
+import uuid
+import torch
+import trimesh
+from huggingface_hub import snapshot_download
+from gradio_model3dcolor import Model3DColor
+from gradio_model3dnormal import Model3DNormal
+code_dir = snapshot_download("sudo-ai/MeshFormer-API", token=os.environ['HF_TOKEN'])
+with open(f'{code_dir}/api.json', 'r') as file:
+    api_dict = json.load(file)
+    SEG_CMD = api_dict["SEG_CMD"]
+    MESH_CMD = api_dict["MESH_CMD"]
+STYLE = """
+    <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.2/dist/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-T3c6CoIi6uLrA9TneNEoa7RxnatzjcDSCmG1MXxSR1GAsXEV/Dwwykc2MPK8M2HN" crossorigin="anonymous">
+"""
+# info (info-circle-fill), cursor (hand-index-thumb), wait (hourglass-split), done (check-circle)
+ICONS = {
+    "info": """<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-info-circle-fill flex-shrink-0 me-2" viewBox="0 0 16 16">
+    <path d="M8 16A8 8 0 1 0 8 0a8 8 0 0 0 0 16zm.93-9.412-1 4.705c-.07.34.029.533.304.533.194 0 .487-.07.686-.246l-.088.416c-.287.346-.92.598-1.465.598-.703 0-1.002-.422-.808-1.319l.738-3.468c.064-.293.006-.399-.287-.47l-.451-.081.082-.381 2.29-.287zM8 5.5a1 1 0 1 1 0-2 1 1 0 0 1 0 2z"/>
+    </svg>""",
+    "cursor": """<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-hand-index-thumb-fill flex-shrink-0 me-2" viewBox="0 0 16 16">
+    <path d="M8.5 1.75v2.716l.047-.002c.312-.012.742-.016 1.051.046.28.056.543.18.738.288.273.152.456.385.56.642l.132-.012c.312-.024.794-.038 1.158.108.37.148.689.487.88.716.075.09.141.175.195.248h.582a2 2 0 0 1 1.99 2.199l-.272 2.715a3.5 3.5 0 0 1-.444 1.389l-1.395 2.441A1.5 1.5 0 0 1 12.42 16H6.118a1.5 1.5 0 0 1-1.342-.83l-1.215-2.43L1.07 8.589a1.517 1.517 0 0 1 2.373-1.852L5 8.293V1.75a1.75 1.75 0 0 1 3.5 0z"/>
+    </svg>""",
+    "wait": """<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-hourglass-split flex-shrink-0 me-2" viewBox="0 0 16 16">
+    <path d="M2.5 15a.5.5 0 1 1 0-1h1v-1a4.5 4.5 0 0 1 2.557-4.06c.29-.139.443-.377.443-.59v-.7c0-.213-.154-.451-.443-.59A4.5 4.5 0 0 1 3.5 3V2h-1a.5.5 0 0 1 0-1h11a.5.5 0 0 1 0 1h-1v1a4.5 4.5 0 0 1-2.557 4.06c-.29.139-.443.377-.443.59v.7c0 .213.154.451.443.59A4.5 4.5 0 0 1 12.5 13v1h1a.5.5 0 0 1 0 1h-11zm2-13v1c0 .537.12 1.045.337 1.5h6.326c.216-.455.337-.963.337-1.5V2h-7zm3 6.35c0 .701-.478 1.236-1.011 1.492A3.5 3.5 0 0 0 4.5 13s.866-1.299 3-1.48V8.35zm1 0v3.17c2.134.181 3 1.48 3 1.48a3.5 3.5 0 0 0-1.989-3.158C8.978 9.586 8.5 9.052 8.5 8.351z"/>
+    </svg>""",
+    "done": """<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-check-circle-fill flex-shrink-0 me-2" viewBox="0 0 16 16">
+    <path d="M16 8A8 8 0 1 1 0 8a8 8 0 0 1 16 0zm-3.97-3.03a.75.75 0 0 0-1.08.022L7.477 9.417 5.384 7.323a.75.75 0 0 0-1.06 1.06L6.97 11.03a.75.75 0 0 0 1.079-.02l3.992-4.99a.75.75 0 0 0-.01-1.05z"/>
+    </svg>""",
+}
+icons2alert = {
+    "info": "primary",  # blue
+    "cursor": "info",  # light blue
+    "wait": "secondary",  # gray
+    "done": "success",  # green
+}
+def message(text, icon_type="info"):
+    return f"""{STYLE}  <div class="alert alert-{icons2alert[icon_type]} d-flex align-items-center" role="alert"> {ICONS[icon_type]}
+                            <div>
+                                {text}
+                            </div>
+                        </div>"""
+def preprocess(tmp_dir, input_img, idx=None):
+    if idx is not None:
+        print("image idx:", int(idx))
+        input_img = Image.open(input_img[int(idx)]["name"])
+    input_img.save(f"{tmp_dir}/input.png")
+    # print(SEG_CMD.format(tmp_dir=tmp_dir))
+    os.system(SEG_CMD.format(tmp_dir=tmp_dir))
+    processed_img = Image.open(f"{tmp_dir}/seg.png")
+    return processed_img.resize((320, 320), Image.Resampling.LANCZOS)
+def ply_to_glb(ply_path):
+    result = subprocess.run(
+        ["python", "ply2glb.py", "--", ply_path],
+        capture_output=True,
+        text=True,
+    )
+    print("Output of blender script:")
+    print(result.stdout)
+    glb_path = ply_path.replace(".ply", ".glb")
+    return glb_path
+def mesh_gen(tmp_dir, simplify, num_inference_steps):
+    # print(MESH_CMD.format(tmp_dir=tmp_dir, num_inference_steps=num_inference_steps))
+    os.system(MESH_CMD.format(tmp_dir=tmp_dir, num_inference_steps=num_inference_steps))
+    mesh = trimesh.load_mesh(f"{tmp_dir}/mesh.ply")
+    vertex_normals = mesh.vertex_normals
+    colors = (-vertex_normals + 1) / 2.0
+    colors = (colors * 255).astype(np.uint8)  # Convert to 8-bit color
+    mesh.visual.vertex_colors = colors[..., [2, 0, 1]]  # RGB -> BRG
+    mesh.export(f"{tmp_dir}/mesh_normal.ply", file_type="ply")
+    color_path = ply_to_glb(f"{tmp_dir}/mesh.ply")
+    normal_path = ply_to_glb(f"{tmp_dir}/mesh_normal.ply")
+    return color_path, normal_path
+def create_tmp_dir():
+    tmp_dir = (
+        "demo_exp/"
+        + datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
+        + "_"
+        + str(uuid.uuid4())[:4]
+    )
+    os.makedirs(tmp_dir, exist_ok=True)
+    print("create tmp_exp_dir", tmp_dir)
+    return tmp_dir
+def vis_seg(checkbox):
+    if checkbox:
+        print("Show manual seg windows")
+        return (
+            [gr.Image(value=None, visible=True)] * 2
+            + [gr.Radio(visible=True)]
+            + [[], gr.Checkbox(visible=True)]
+        )
+    else:
+        print("Clear manual seg")
+        return (
+            [gr.Image(visible=False)] * 2
+            + [gr.Radio(visible=False)]
+            + [[], gr.Checkbox(visible=False)]
+        )
+def calc_feat(checkbox, predictor, input_image, idx=None):
+    if checkbox:
+        if idx is not None:
+            print("image idx:", int(idx))
+            input_image = Image.open(input_image[int(idx)]["name"])
+        input_image.thumbnail([512, 512], Image.Resampling.LANCZOS)
+        w, h = input_image.size
+        print("image size:", w, h)
+        side_len = np.max((w, h))
+        seg_in = Image.new(input_image.mode, (side_len, side_len), (255, 255, 255))
+        seg_in.paste(
+            input_image, (np.max((0, (h - w) // 2)), np.max((0, (w - h) // 2)))
+        )
+        print("Calculating image SAM feature...")
+        predictor.set_image(np.array(seg_in.convert("RGB")))
+        torch.cuda.empty_cache()
+        return gr.Image(value=seg_in, visible=True)
+    else:
+        print("Quit manual seg")
+        raise ValueError("Quit manual seg")
+def manual_seg(
+    predictor,
+    seg_in,
+    selected_points,
+    fg_bg_radio,
+    tmp_dir,
+    seg_mask_opt,
+    evt: gr.SelectData,
+):
+    print("Start segmentation")
+    selected_points.append(
+        {"coord": evt.index, "add_del": fg_bg_radio == "+ (add mask)"}
+    )
+    input_points = np.array([point["coord"] for point in selected_points])
+    input_labels = np.array([point["add_del"] for point in selected_points])
+    out_image = sam_seg(
+        predictor, np.array(seg_in.convert("RGB")), input_points, input_labels
+    )
+    # seg_in.save(f"{tmp_dir}/in.png")
+    # out_image.save(f"{tmp_dir}/out.png")
+    if seg_mask_opt:
+        segmentation = blend_seg_pure(
+            seg_in.convert("RGB"), out_image, input_points, input_labels
+        )
+    else:
+        segmentation = blend_seg(
+            seg_in.convert("RGB"), out_image, input_points, input_labels
+        )
+    # recenter and rescale
+    image_arr = np.array(out_image)
+    ret, mask = cv2.threshold(
+        np.array(out_image.split()[-1]), 0, 255, cv2.THRESH_BINARY
+    )
+    x, y, w, h = cv2.boundingRect(mask)
+    max_size = max(w, h)
+    ratio = 0.75
+    side_len = int(max_size / ratio)
+    padded_image = np.zeros((side_len, side_len, 4), dtype=np.uint8)
+    center = side_len // 2
+    padded_image[
+        center - h // 2 : center - h // 2 + h, center - w // 2 : center - w // 2 + w
+    ] = image_arr[y : y + h, x : x + w]
+    rgba = Image.fromarray(padded_image)
+    rgba.save(f"{tmp_dir}/seg.png")
+    torch.cuda.empty_cache()
+    return segmentation.resize((380, 380), Image.Resampling.LANCZOS), rgba.resize(
+        (320, 320), Image.Resampling.LANCZOS
+    )
+# Soft theme with a blue primary hue and neutral fills for secondary buttons.
+custom_theme = gr.themes.Soft(primary_hue="blue").set(
+    button_secondary_background_fill="*neutral_100",
+    button_secondary_background_fill_hover="*neutral_200",
+)
+# Page layout and event wiring for the image-to-mesh demo.
+with gr.Blocks(title="MeshFormer Demo", css="style.css", theme=custom_theme) as demo:
+    with gr.Row():
+        gr.Markdown(
+            "# MeshFormer: High-Quality Mesh Generation with 3D-Guided Reconstruction Model"
+        )
+    with gr.Row():
+        gr.Markdown(
+            "[Project Page](https://meshformer3d.github.io/) | [arXiv](https://arxiv.org/abs/TBD)"
+        )
+    with gr.Row():
+        gr.Markdown(
+            """
+<div>
+<b><em>Check out <a href="https://www.sudo.ai/3dgen">Hillbot (sudoAI)</a> for more details and advanced features.</em></b>
+</div>
+"""
+        )
+    # Status banner; the handlers below replace its HTML through update_guide.
+    with gr.Row():
+        guide_text_i2m = gr.HTML(message("Please input an image!"), visible=True)
+    # Working-directory state. Only tmp_dir_img is used by the handlers below.
+    tmp_dir_img = gr.State("./demo_exp/placeholder")
+    tmp_dir_txt = gr.State("./demo_exp/placeholder")
+    tmp_dir_3t3 = gr.State("./demo_exp/placeholder")
+    # Every file in demo_examples/ is offered as an example, sorted by name.
+    example_folder = os.path.join(os.path.dirname(__file__), "demo_examples")
+    example_fns = os.listdir(example_folder)
+    example_fns.sort()
+    img_examples = [
+        os.path.join(example_folder, x) for x in example_fns
+    ]  # if x.endswith('.png') or x.endswith('.')
+    with gr.Row(variant="panel"):
+        with gr.Row():
+            with gr.Column(scale=8):
+                input_image = gr.Image(
+                    type="pil",
+                    image_mode="RGBA",
+                    height=320,
+                    label="Input Image",
+                    interactive=True,
+                )
+                gr.Examples(
+                    examples=img_examples,
+                    inputs=[input_image],
+                    outputs=[input_image],
+                    cache_examples=False,
+                    label="Image Examples (Click one of the images below to start)",
+                    examples_per_page=27,
+                )
+                with gr.Accordion("Options", open=False):
+                    img_simplify = gr.Checkbox(
+                        False, label="simplify the generated mesh", visible=False
+                    )
+                    n_steps_img = gr.Slider(
+                        value=28,
+                        minimum=15,
+                        maximum=100,
+                        step=1,
+                        label="number of inference steps",
+                    )
+                # Manual segmentation widgets; all start hidden and are toggled by vis_seg.
+                checkbox_manual_seg = gr.Checkbox(False, label="manual segmentation")
+                with gr.Row():
+                    with gr.Column(scale=1):
+                        seg_in = gr.Image(
+                            type="pil",
+                            image_mode="RGBA",
+                            label="Click to segment",
+                            visible=False,
+                            show_download_button=False,
+                            height=380,
+                        )
+                    with gr.Column(scale=1):
+                        seg_out = gr.Image(
+                            type="pil",
+                            image_mode="RGBA",
+                            label="Segmentation",
+                            interactive=False,
+                            visible=False,
+                            show_download_button=False,
+                            height=380,
+                            elem_id="disp_image",
+                        )
+                fg_bg_radio = gr.Radio(
+                    ["+ (add mask)", "- (remove area)"],
+                    value="+ (add mask)",
+                    info="Select foreground (+) or background (-) point",
+                    label="Point label",
+                    visible=False,
+                    interactive=True,
+                )
+                seg_mask_opt = gr.Checkbox(
+                    True,
+                    label="show foreground mask in manual segmentation",
+                    visible=False,
+                )
+                # Generate button; disabled until preprocessing has succeeded.
+                img_run_btn = gr.Button(
+                    "Generate", variant="primary", interactive=False
+                )
+            with gr.Column(scale=6):
+                # NOTE(review): elem_id "disp_image" is also used by seg_out above.
+                processed_image = gr.Image(
+                    type="pil",
+                    label="Processed Image",
+                    interactive=False,
+                    height=320,
+                    image_mode="RGBA",
+                    elem_id="disp_image",
+                )
+                # with gr.Row():
+                # mesh_output = gr.Model3D(label="Generated Mesh", elem_id="model-3d-out")
+                mesh_output_normal = Model3DNormal(
+                    label="Generated Mesh (normal)",
+                    elem_id="mesh-normal-out",
+                    height=400,
+                )
+                mesh_output = Model3DColor(
+                    label="Generated Mesh (color)",
+                    elem_id="mesh-out",
+                    height=400,
+                )
+    # The SAM predictor is built once here and passed to handlers via gr.State.
+    predictor = gr.State(value=get_sam_predictor())
+    # Points clicked so far during manual segmentation (appended to by manual_seg).
+    selected_points = gr.State(value=[])
+    # NOTE(review): selected_points_t2i and update_md are not used by the handlers below.
+    selected_points_t2i = gr.State(value=[])
+    # Small helpers returning component updates for the event chains.
+    disable_checkbox = lambda: gr.Checkbox(value=False)
+    disable_button = lambda: gr.Button(interactive=False)
+    enable_button = lambda: gr.Button(interactive=True)
+    update_guide = lambda GUIDE_TEXT, icon_type="info": gr.HTML(
+        value=message(GUIDE_TEXT, icon_type)
+    )
+    update_md = lambda GUIDE_TEXT: gr.Markdown(value=GUIDE_TEXT)
+    # Raises when the image is falsy so the remaining .success() steps are skipped.
+    def is_img_clear(input_image):
+        if not input_image:
+            raise ValueError("Input image cleared.")
+    # Toggling manual segmentation: show/hide widgets, compute SAM features
+    # (calc_feat raises when the box is unchecked), then start a new work dir.
+    checkbox_manual_seg.change(
+        vis_seg,
+        inputs=[checkbox_manual_seg],
+        outputs=[seg_in, seg_out, fg_bg_radio, selected_points, seg_mask_opt],
+        queue=False,
+    ).success(
+        calc_feat,
+        inputs=[checkbox_manual_seg, predictor, input_image],
+        outputs=[seg_in],
+    ).success(
+        fn=create_tmp_dir, outputs=[tmp_dir_img], queue=False
+    )
+    # Each click on seg_in adds a point and refreshes the preview and cut-out.
+    seg_in.select(
+        manual_seg,
+        [predictor, seg_in, selected_points, fg_bg_radio, tmp_dir_img, seg_mask_opt],
+        [seg_out, processed_image],
+    )
+    # New input image: disable Generate, uncheck manual segmentation, stop if
+    # the image was cleared, otherwise preprocess and re-enable Generate.
+    input_image.change(disable_button, outputs=img_run_btn, queue=False).success(
+        disable_checkbox, outputs=checkbox_manual_seg, queue=False
+    ).success(fn=is_img_clear, inputs=input_image, queue=False).success(
+        fn=create_tmp_dir, outputs=tmp_dir_img, queue=False
+    ).success(
+        fn=partial(update_guide, "Preprocessing the image!", "wait"),
+        outputs=[guide_text_i2m],
+        queue=False,
+    ).success(
+        fn=preprocess,
+        inputs=[tmp_dir_img, input_image],
+        outputs=[processed_image],
+        queue=True,
+    ).success(
+        fn=partial(
+            update_guide,
+            "Click <b>Generate</b> to generate mesh! If the input image was not segmented accurately, please adjust it using <b>manual segmentation</b>.",
+            "cursor",
+        ),
+        outputs=[guide_text_i2m],
+        queue=False,
+    ).success(
+        enable_button, outputs=img_run_btn, queue=False
+    )
+    # Generate: mesh_gen returns (color_path, normal_path), matching the
+    # order of the two output components.
+    img_run_btn.click(
+        fn=partial(update_guide, "Generating the mesh!", "wait"),
+        outputs=[guide_text_i2m],
+        queue=False,
+    ).success(
+        fn=mesh_gen,
+        inputs=[tmp_dir_img, img_simplify, n_steps_img],
+        outputs=[mesh_output, mesh_output_normal],
+        queue=True,
+    ).success(
+        fn=partial(
+            update_guide,
+            "Successfully generated the mesh. (It might take a few seconds to load the mesh)",
+            "done",
+        ),
+        outputs=[guide_text_i2m],
+        queue=False,
+    )
+# server_name="0.0.0.0" makes the server listen on all network interfaces.
+demo.queue().launch(
+    debug=True, share=False, inline=False, show_api=False, server_name="0.0.0.0"
+)

gradio_model3dcolor-0.0.1-py3-none-any.whl ADDED Viewed

Binary file (995 kB). View file

gradio_model3dnormal-0.0.1-py3-none-any.whl ADDED Viewed

Binary file (995 kB). View file

ply2glb.py ADDED Viewed

	@@ -0,0 +1,57 @@

+import bpy
+import sys
+# Clear the scene
+bpy.ops.object.select_all(action="SELECT")
+bpy.ops.object.delete(use_global=False)
+# Load mesh.ply
+ply_path = sys.argv[-1]
+bpy.ops.wm.ply_import(filepath=ply_path)
+# Create a new material
+material = bpy.data.materials.new(name="New_Material")
+material.use_nodes = True
+# Assign the material to the object
+obj = bpy.context.selected_objects[0]
+if obj.data.materials:
+    obj.data.materials[0] = material
+else:
+    obj.data.materials.append(material)
+# Add a Vertex Color node and link it
+nodes = material.node_tree.nodes
+links = material.node_tree.links
+# Clear default nodes
+for node in nodes:
+    nodes.remove(node)
+# Create nodes
+output_node = nodes.new(type="ShaderNodeOutputMaterial")
+vertex_color_node = nodes.new(type="ShaderNodeVertexColor")
+principled_bsdf = nodes.new(type="ShaderNodeBsdfPrincipled")
+# Set the vertex color layer name
+vertex_color_node.layer_name = "Col"
+# Arrange nodes
+vertex_color_node.location = (-300, 0)
+principled_bsdf.location = (0, 0)
+output_node.location = (300, 0)
+# Link nodes
+links.new(vertex_color_node.outputs["Color"], principled_bsdf.inputs["Base Color"])
+links.new(principled_bsdf.outputs["BSDF"], output_node.inputs["Surface"])
+# Rotate the object
+bpy.context.object.rotation_euler[2] = 1.57079
+# Export the scene to a glTF file
+glb_path = ply_path.replace(".ply", ".glb")
+bpy.ops.export_scene.gltf(filepath=glb_path, export_format="GLB")
+# Free up memory
+bpy.ops.wm.read_factory_settings(use_empty=True)

sam_inference.py ADDED Viewed

	@@ -0,0 +1,40 @@

+import numpy as np
+import torch
+from segment_anything import SamPredictor, sam_model_registry
+from PIL import Image
+models = {
+    'vit_b': './checkpoints/sam_vit_b_01ec64.pth',
+    'vit_l': './checkpoints/sam_vit_l_0b3195.pth',
+    'vit_h': './checkpoints/sam_vit_h_4b8939.pth'
+}
+def get_sam_predictor(model_type='vit_h', device=None, image=None):
+    if device is None and torch.cuda.is_available():
+        device = 'cuda'
+    elif device is None:
+        device = 'cpu'
+    # sam model
+    sam = sam_model_registry[model_type](checkpoint=models[model_type])
+    sam = sam.to(device)
+    predictor = SamPredictor(sam)
+    if image is not None:
+        predictor.set_image(image)
+    return predictor
+def sam_seg(predictor, input_img, input_points, input_labels):
+    masks, scores, logits = predictor.predict(
+        point_coords=input_points,
+        point_labels=input_labels,
+        multimask_output=True,
+    )
+    opt_idx = np.argmax(scores)
+    mask = masks[opt_idx]
+    out_image = np.zeros((input_img.shape[0], input_img.shape[1], 4), dtype=np.uint8)
+    out_image[:, :, :3] = input_img
+    out_image[:, :, 3] = mask.astype(np.uint8) * 255
+    torch.cuda.empty_cache()
+    return Image.fromarray(out_image, mode='RGBA')

style.css ADDED Viewed

	@@ -0,0 +1,32 @@

+/* Fixed height for the element with id "model-3d-out".
+   NOTE(review): in gradio_demo.py this id only appears in a commented-out line. */
+#model-3d-out {
+    height: 400px;
+}
+/* Shared by the image components created with elem_id="disp_image". */
+#disp_image {
+    text-align: center; /* Horizontally center the content */
+}
+.centered {
+    text-align: center; /* Horizontally center the content */
+}
+.centered img {
+    display: block; /* Make the image a block element */
+    margin: 0 auto; /* Center the block element (the image) horizontally */
+    height: 100px;
+}
+/* Remove the gap and the touching corner radii between the prompt form and
+   the button next to it.
+   NOTE(review): these selectors are not referenced in gradio_demo.py. */
+#prompt-container{
+    gap: 0;
+}
+#prompt-container .form{
+    border-top-right-radius: 0;
+    border-bottom-right-radius: 0;
+}
+#gen-button{
+    border-top-left-radius:0;
+    border-bottom-left-radius:0;
+}
+/* Larger label for the selected tab button. */
+.tab_at_top button.selected{
+    font-size: 24px !important;
+}

utils.py ADDED Viewed

	@@ -0,0 +1,86 @@

+import cv2
+import numpy as np
+from PIL import Image
+# marker choices
+COLORS = [(246, 195, 203), (112, 221, 208)]
+MARKERS = [1, 5]
+def blend_seg(input_image, segmented_image, dot_locations, dot_labels, contour_color=(63, 126, 174)):
+    input_image = np.array(input_image)
+    segmented_image = np.array(segmented_image)
+    # Create a mask for the foreground (non-transparent) pixels
+    foreground_mask = segmented_image[:, :, 3] > 0
+    # Create a mask for the background (transparent) pixels
+    background_mask = ~foreground_mask
+    # Darken the background pixels
+    darkened_background = input_image.copy()
+    darkened_background[background_mask] = darkened_background[background_mask] * 0.52  # Adjust the multiplier as needed to control darkness
+    # Create an empty mask for the boundary
+    boundary_mask = np.zeros_like(segmented_image[:, :, 3], dtype=np.uint8)
+    solid_boundary_mask = np.zeros_like(segmented_image[:, :, 3], dtype=np.uint8)
+    # Find the contour of the segmented region
+    contours, _ = cv2.findContours(
+        segmented_image[:, :, 3], cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE
+    )
+    # Draw the boundary on the boundary mask
+    cv2.drawContours(boundary_mask, contours, -1, (255), thickness=6)
+    cv2.drawContours(solid_boundary_mask, contours, -1, (255), thickness=2)
+    blur_mask = cv2.GaussianBlur(boundary_mask, (0, 0), sigmaX=4)
+    # Create a mask for the contour region
+    contour_region_mask = (blur_mask > 0)
+    # Blend the contour color with the existing pixel colors
+    result_image = darkened_background.copy()
+    mask_weight = 0.9 * blur_mask[contour_region_mask, None]/255
+    result_image[contour_region_mask] = (
+        darkened_background[contour_region_mask] * (1-mask_weight) + np.array(contour_color) * mask_weight
+    ).astype(np.uint8)
+    # Overlay the contour on the result image without blending
+    result_image[solid_boundary_mask > 0] = contour_color  # Set contour pixels to blue
+    # Draw dots at the specified locations
+    dot_radius = 6
+    for location, label in zip(dot_locations, dot_labels):
+        if label:
+            cv2.circle(result_image, location, dot_radius, COLORS[label], -1)
+        else:
+            cv2.drawMarker(result_image, location, COLORS[label], markerType=MARKERS[label],
+                        markerSize=6, thickness=3)
+    return Image.fromarray(result_image)
+def blend_seg_pure(input_image, segmented_image, dot_locations, dot_labels):
+    input_image = np.array(input_image)
+    segmented_image = np.array(segmented_image)
+    # Create a mask for the foreground (non-transparent) pixels
+    foreground_mask = segmented_image[:, :, 3] > 0
+    # Blend the foreground
+    red_foreground = input_image.copy()
+    blend_weight = 0.8
+    red_foreground[foreground_mask] = red_foreground[foreground_mask] *(1-blend_weight) + np.array((255,0,0)) * blend_weight
+    result_image = red_foreground
+    # Draw dots at the specified locations
+    dot_radius = 6
+    for location, label in zip(dot_locations, dot_labels):
+        if label:
+            cv2.circle(result_image, location, dot_radius, COLORS[label], -1)
+        else:
+            cv2.drawMarker(result_image, location, COLORS[label], markerType=MARKERS[label],
+                        markerSize=6, thickness=3)
+    return Image.fromarray(result_image)