Spaces:

paulpanwang
/

Diffsplat

Running on Zero

App Files Files Community

paulpanwang committed on Feb 5

Commit

476e0f0

verified ·

1 Parent(s): f00d8af

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +100 -0
.gitignore +11 -0
LICENSE +21 -0
README.md +302 -9
app.py +165 -0
assets/_demo/1.gif +3 -0
assets/_demo/10.gif +3 -0
assets/_demo/2.gif +3 -0
assets/_demo/3.gif +3 -0
assets/_demo/4.gif +3 -0
assets/_demo/5.gif +3 -0
assets/_demo/6.gif +3 -0
assets/_demo/7.gif +3 -0
assets/_demo/8.gif +3 -0
assets/_demo/9.gif +3 -0
assets/_demo/a_frog/pas.gif +3 -0
assets/_demo/a_frog/sd15.gif +3 -0
assets/_demo/a_frog/sd35m.gif +3 -0
assets/_demo/a_frog_elevest/pas.gif +3 -0
assets/_demo/a_frog_elevest/sd15.gif +3 -0
assets/_demo/a_frog_elevest/sd35m.gif +3 -0
assets/_demo/a_frog_empty/pas.gif +3 -0
assets/_demo/a_frog_empty/sd15.gif +3 -0
assets/_demo/a_frog_empty/sd35m.gif +3 -0
assets/_demo/a_toy_robot/pas.gif +3 -0
assets/_demo/a_toy_robot/sd15.gif +3 -0
assets/_demo/a_toy_robot/sd35m.gif +3 -0
assets/_demo/controlnet/book.gif +3 -0
assets/_demo/controlnet/cookie.gif +3 -0
assets/_demo/controlnet/iron_robot.gif +3 -0
assets/_demo/controlnet/panda.gif +3 -0
assets/_demo/controlnet/plush_dog_toy.gif +3 -0
assets/_demo/controlnet/teddy_bear.gif +3 -0
assets/_demo/overview.png +3 -0
assets/crm/3D/345/215/241/351/200/232/347/213/227.webp +0 -0
assets/crm/astronaut.webp +3 -0
assets/crm/bulldog.webp +0 -0
assets/crm/ghost-eating-burger.webp +0 -0
assets/crm/kunkun.webp +0 -0
assets/crm//344/270/207/345/234/243/345/215/227/347/223/234.webp +0 -0
assets/crm//344/272/272/347/211/251/351/252/221/351/251/254.webp +0 -0
assets/crm//345/210/235/351/237/263/346/234/252/346/235/245/347/216/251/345/201/266.webp +0 -0
assets/crm//345/215/241/351/200/232/346/201/220/351/276/231.webp +0 -0
assets/crm//345/215/241/351/200/232/346/211/213/346/236/252/346/210/252/345/233/276.webp +0 -0
assets/crm//345/215/241/351/200/232/347/214/253.webp +0 -0
assets/crm//345/215/241/351/200/232/350/230/221/350/217/207/345/245/227/350/243/205.webp +0 -0
assets/crm//345/217/257/347/210/261/347/216/204/347/255/226.webp +0 -0
assets/crm/大头泡泡马特.webp +3 -0
assets/crm//345/275/251/350/211/262/350/230/221/350/217/207.webp +0 -0
assets/crm//345/275/251/350/211/262/350/230/221/350/217/2072.webp +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,103 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+assets/_demo/1.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/10.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/2.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/3.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/4.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/5.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/6.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/7.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/8.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/9.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog/pas.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog/sd15.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog/sd35m.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_elevest/pas.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_elevest/sd15.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_elevest/sd35m.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_empty/pas.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_empty/sd15.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_frog_empty/sd35m.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_toy_robot/pas.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_toy_robot/sd15.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/a_toy_robot/sd35m.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/book.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/cookie.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/iron_robot.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/panda.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/plush_dog_toy.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/controlnet/teddy_bear.gif filter=lfs diff=lfs merge=lfs -text
+assets/_demo/overview.png filter=lfs diff=lfs merge=lfs -text
+assets/crm/astronaut.webp filter=lfs diff=lfs merge=lfs -text
+assets/crm/大头泡泡马特.webp filter=lfs diff=lfs merge=lfs -text
+assets/crm/武器-剑.webp filter=lfs diff=lfs merge=lfs -text
+assets/crm/毛线衣.webp filter=lfs diff=lfs merge=lfs -text
+assets/crm/翅膀道具.webp filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/1_wukong_avatar.png filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/2_wukong_sculpture.png filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/3_wukong_toy.png filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/4_mask.png filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/5_bajie.png filter=lfs diff=lfs merge=lfs -text
+assets/diffsplat/6_armor.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/17_dalle3_rockingchair1.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/19_dalle3_stump1.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/astronaut.webp filter=lfs diff=lfs merge=lfs -text
+assets/grm/coat.webp filter=lfs diff=lfs merge=lfs -text
+assets/grm/david.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/dreamcraft3d_00.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/dreamcraft3d_01.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/dreamcraft3d_02.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/frog.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/girl1_padded.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/girl2_copy.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/image.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/ironman_helmet.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/panda.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/sculpture_0.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/turtle.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/unicorn.png filter=lfs diff=lfs merge=lfs -text
+assets/grm/zebra.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/blue_cat.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/bubble_mart_blue.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/bulldog.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/cartoon_dinosaur.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/cartoon_panda.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/chair_armed.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/chair_watermelon.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/cute_horse.jpg filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/pikachu.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/sea_turtle.png filter=lfs diff=lfs merge=lfs -text
+assets/instantmesh/sword.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/capreal/caprealinputsonly.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/capreal/caprealmesh.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/capreal/caprealpointcloud.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/capreal/meshlab.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/class/sibr_classes_v2.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/AssetStreamer/seq_assetStreamer.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/Renderers/seq_insideOut.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/Renderers/seq_ulr_stream.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/Renderers/seq_ulr_v3_landscape.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/Unity/seq_unity_ulr_rendering.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/diagramas/sequence/Unity/seq_unity_ulr_texture_upload.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/ibr_common_cmake.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/jesnault_git_cheat_sheet.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/multimeshmanager.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/multiviewmanager.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/SIBR_viewers/docs/img/ulr_screenshot.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/assets/teaser.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/paper.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/submodules/diff-gaussian-rasterization/dist/diff_gaussian_rasterization-0.0.0-cp310-cp310-linux_x86_64.whl filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/submodules/diff-gaussian-rasterization/third_party/glm/doc/manual/frontpage1.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/submodules/diff-gaussian-rasterization/third_party/glm/doc/manual/frontpage2.png filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/submodules/diff-gaussian-rasterization/third_party/glm/doc/manual.pdf filter=lfs diff=lfs merge=lfs -text
+extensions/RaDe-GS/submodules/frpc_linux_amd64_v0.2 filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/22/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/33a17050938079dd150f/_a[[:space:]]toy[[:space:]]robot..._013020.ply filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/22/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/9084f12000e4d0861282/_a[[:space:]]cute[[:space:]]panda..._013020.ply filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/22/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/927242333ba684b13bb2/_a[[:space:]]book..._013020.ply filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/23/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/1174ce83af0bcabb215a/_a[[:space:]]book..._013020.ply filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/23/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/743ad8490995e372c5f3/_a[[:space:]]cute[[:space:]]panda..._013020.ply filter=lfs diff=lfs merge=lfs -text
+gradio_cached_examples/23/3D[[:space:]]Gaussians[[:space:]]ply[[:space:]]format/e611dc2e9fbf1acd1cfc/_a[[:space:]]toy[[:space:]]robot..._013020.ply filter=lfs diff=lfs merge=lfs -text
+tmp/input_image.png filter=lfs diff=lfs merge=lfs -text
+wheel/diff_gaussian_rasterization-0.0.0-cp310-cp310-linux_x86_64.whl filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,11 @@

+__pycache__/
+build/
+*.egg-info/
+out/
+temp/
+log/
+download/*.json
+download/*.csv
+temp*.*
+*.tar*
+*.vsix

LICENSE ADDED Viewed

	@@ -0,0 +1,21 @@

+MIT License
+Copyright (c) 2025 Chenguo Lin
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

README.md CHANGED Viewed

@@ -1,13 +1,306 @@
 ---
-title: Diffsplat
-emoji: ⚡
-colorFrom: yellow
-colorTo: gray
-sdk: gradio
-sdk_version: 5.15.0
 app_file: app.py
-pinned: false
-license: mit
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: DiffSplat
 app_file: app.py
+sdk: gradio
+sdk_version: 4.44.1
 ---
+# [ICLR 2025] DiffSplat
+<h4 align="center">
+DiffSplat: Repurposing Image Diffusion Models for Scalable Gaussian Splat Generation
+[Chenguo Lin](https://chenguolin.github.io), [Panwang Pan](https://paulpanwang.github.io), [Bangbang Yang](https://ybbbbt.com), [Zeming Li](https://www.zemingli.com), [Yadong Mu](http://www.muyadong.com)
+[![arXiv](https://img.shields.io/badge/arXiv-2501.16764-b31b1b.svg?logo=arXiv)](https://arxiv.org/abs/2501.16764)
+[![Project page](https://img.shields.io/badge/Project-Page-brightgreen)](https://chenguolin.github.io/projects/DiffSplat)
+[![Model](https://img.shields.io/badge/HF-Model-yellow)](https://huggingface.co/chenguolin/DiffSplat)
+<p>
+    <img width="144" src="./assets/_demo/1.gif">
+    <img width="144" src="./assets/_demo/2.gif">
+    <img width="144" src="./assets/_demo/3.gif">
+    <img width="144" src="./assets/_demo/4.gif">
+    <img width="144" src="./assets/_demo/5.gif">
+</p>
+<p>
+    <img width="144" src="./assets/_demo/6.gif">
+    <img width="144" src="./assets/_demo/7.gif">
+    <img width="144" src="./assets/_demo/8.gif">
+    <img width="144" src="./assets/_demo/9.gif">
+    <img width="144" src="./assets/_demo/10.gif">
+</p>
+<p>
+    <img width="730" src="./assets/_demo/overview.png">
+</p>
+</h4>
+This repository contains the official implementation of the paper: [DiffSplat: Repurposing Image Diffusion Models for Scalable Gaussian Splat Generation](https://arxiv.org/abs/2501.16764), which is accepted to ICLR 2025.
+DiffSplat is a generative framework to synthesize 3D Gaussian Splats from text prompts & single-view images in 1~2 seconds. It is fine-tuned directly from a pretrained text-to-image diffusion model.
+Feel free to contact me ([email protected]) or open an issue if you have any questions or suggestions.
+## 📢 News
+- **2025-02-02**: Inference instructions (text-conditioned & image-conditioned & controlnet) are provided.
+- **2025-01-29**: The source code and pretrained models are released. Happy 🐍 Chinese New Year 🎆!
+- **2025-01-22**: DiffSplat is accepted to ICLR 2025.
+## 📋 TODO
+- [x] Provide detailed instructions for inference.
+- [ ] Provide detailed instructions for training.
+- [ ] Implement a Gradio demo.
+## 🔧 Installation
+You may need to modify the specific version of `torch` in `settings/setup.sh` according to your CUDA version.
+There are no restrictions on the `torch` version, feel free to use your preferred one.
+```bash
+git clone https://github.com/chenguolin/DiffSplat.git
+cd DiffSplat
+bash settings/setup.sh
+```
+## 📊 Dataset
+- We use [G-Objaverse](https://github.com/modelscope/richdreamer/tree/main/dataset/gobjaverse) with about 265K 3D objects and 10.6M rendered images (265K x 40 views, including RGB, normal and depth maps) for `GSRecon` and `GSVAE` training. [Its subset](https://github.com/ashawkey/objaverse_filter) with about 83K 3D objects provided by [LGM](https://me.kiui.moe/lgm) is used for `DiffSplat` training. Their text descriptions are provided by the latest version of [Cap3D](https://huggingface.co/datasets/tiange/Cap3D) (i.e., refined by [DiffuRank](https://arxiv.org/abs/2404.07984)).
+- We find the filtering is crucial for the generation quality of `DiffSplat`, and a larger dataset is beneficial for the performance of `GSRecon` and `GSVAE`.
+- We store the dataset in an internal HDFS cluster in this project. Thus, the training code can NOT be directly run on your local machine. Please implement your own dataloading logic referring to our provided dataset & dataloader code.
+## 🚀 Usage
+### 📷 Camera Conventions
+The camera and world coordinate systems in this project are both defined in the `OpenGL` convention, i.e., X: right, Y: up, Z: backward. The camera is located at `(0, 0, 1.4)` in the world coordinate system, and the camera looks at the origin `(0, 0, 0)`.
+Please refer to [kiuikit camera doc](https://kit.kiui.moe/camera) for visualizations of the camera and world coordinate systems.
+### 🤗 Pretrained Models
+All pretrained models are available at [HuggingFace🤗](https://huggingface.co/chenguolin/DiffSplat).
+| **Model Name**                | **Fine-tuned From** | **#Param.** | **Link** | **Note** |
+|-------------------------------|---------------------|-------------|----------|----------|
+| **GSRecon**                   | From scratch                    | 42M            | [gsrecon_gobj265k_cnp_even4](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsrecon_gobj265k_cnp_even4)         | Feed-forward reconstruct per-pixel 3DGS from (RGB, normal, point) maps         |
+| **GSVAE (SD)**                | [SD1.5 VAE](https://huggingface.co/stable-diffusion-v1-5/stable-diffusion-v1-5)                    | 84M            | [gsvae_gobj265k_sd](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsvae_gobj265k_sd)         |          |
+| **GSVAE (SDXL)**              | [SDXL fp16 VAE](https://huggingface.co/madebyollin/sdxl-vae-fp16-fix)                    | 84M            | [gsvae_gobj265k_sdxl_fp16](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsvae_gobj265k_sdxl_fp16)         | fp16-fixed SDXL VAE is more robust         |
+| **GSVAE (SD3)**               | [SD3 VAE](https://huggingface.co/stabilityai/stable-diffusion-3-medium)                    | 84M            | [gsvae_gobj265k_sd3](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsvae_gobj265k_sd3)         |          |
+| **DiffSplat (SD1.5)**            | [SD1.5](https://huggingface.co/stable-diffusion-v1-5/stable-diffusion-v1-5)                    | 0.86B            | Text-cond: [gsdiff_gobj83k_sd15__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd15__render)<br> Image-cond: [gsdiff_gobj83k_sd15_image__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd15_image__render)         | Best efficiency         |
+| **DiffSplat (PixArt-Sigma)** | [PixArt-Sigma](https://huggingface.co/PixArt-alpha/PixArt-Sigma-XL-2-512-MS)                    | 0.61B            | Text-cond: [gsdiff_gobj83k_pas_fp16__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_pas_fp16__render)<br> Image-cond: [gsdiff_gobj83k_pas_fp16_image__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_pas_fp16_image__render)         | Best Trade-off         |
+| **DiffSplat (SD3.5m)**         | [SD3.5 medium](https://huggingface.co/stabilityai/stable-diffusion-3.5-medium)                    | 2.24B            | Text-cond: [gsdiff_gobj83k_sd35m__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd35m__render)<br> Image-cond: [gsdiff_gobj83k_sd35m_image__render](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd35m_image__render)         | Best performance        |
+| **DiffSplat ControlNet (SD1.5)**         | From scratch                    | 361M            | Depth: [gsdiff_gobj83k_sd15__render__depth](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd15__render__depth)<br> Normal: [gsdiff_gobj83k_sd15__render__normal](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd15__render__normal)<br> Canny: [gsdiff_gobj83k_sd15__render__canny](https://huggingface.co/chenguolin/DiffSplat/tree/main/gsdiff_gobj83k_sd15__render__canny)         |          |
+| **(Optional) ElevEst**                   | [dinov2_vitb14_reg](https://github.com/facebookresearch/dinov2)                    | 86M            | [elevest_gobj265k_b_C25](https://huggingface.co/chenguolin/DiffSplat/tree/main/elevest_gobj265k_b_C25)         | (Optional) Single-view image elevation estimation        |
+### ⚡ Inference
+#### 0. Download Pretrained Models
+Note that:
+- Pretrained weights will be downloaded from HuggingFace and stored in `./out`.
+- Other pretrained models (such as CLIP, T5, image VAE, etc.) will be downloaded automatically and stored in your HuggingFace cache directory.
+- If you face problems in visiting HuggingFace Hub, you can try to set the environment variable `export HF_ENDPOINT=https://hf-mirror.com`.
+```bash
+python3 download_ckpt.py --model_type [MODEL_TYPE] [--image_cond]
+# `MODEL_TYPE`: choose from "sd15", "pas", "sd35m", "depth", "normal", "canny", "elevest".
+# `--image_cond`: add this flag for downloading image-conditioned models
+```
+For example, to download the `text-cond SD1.5-based DiffSplat`:
+```bash
+python3 download_ckpt.py --model_type sd15
+```
+To download the `image-cond PixArt-Sigma-based DiffSplat`:
+```bash
+python3 download_ckpt.py --model_type pas --image_cond
+```
+#### 1. Text-conditioned 3D Object Generation
+Note that:
+- Model differences may not be significant for simple text prompts. We recommend using `DiffSplat (SD1.5)` for better efficiency, `DiffSplat (SD3.5m)` for better performance, and `DiffSplat (PixArt-Sigma)` for a better trade-off.
+- By default, `export HF_HOME=~/.cache/huggingface`, `export TORCH_HOME=~/.cache/torch`. You can change these paths in `scripts/infer.sh`. SD3-related models require a HuggingFace token for downloading, which is expected to be stored in `HF_HOME`.
+- Outputs will be stored in `./out/<MODEL_NAME>/inference`.
+- Prompt is specified by `--prompt` (e.g., `a_toy_robot`). Please separate words with `_`; the underscores will be replaced with spaces in the code automatically.
+- If `"gif"` is in `--output_video_type`, the output will be a `.gif` file. Otherwise, it will be a `.mp4` file. If `"fancy"` is in `--output_video_type`, the output video will be in a fancy style that 3DGS scales gradually increase while rotating.
+- `--seed` is used for random seed setting. `--gpu_id` is used for specifying the GPU device.
+- Use `--half_precision` for `BF16` half-precision inference. It will reduce the memory usage but may slightly affect the quality.
+```bash
+# DiffSplat (SD1.5)
+bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml gsdiff_gobj83k_sd15__render \
+--prompt a_toy_robot --output_video_type gif \
+--gpu_id 0 --seed 0 [--half_precision]
+# DiffSplat (PixArt-Sigma)
+bash scripts/infer.sh src/infer_gsdiff_pas.py configs/gsdiff_pas.yaml gsdiff_gobj83k_pas_fp16__render \
+--prompt a_toy_robot --output_video_type gif \
+--gpu_id 0 --seed 0 [--half_precision]
+# DiffSplat (SD3.5m)
+bash scripts/infer.sh src/infer_gsdiff_sd3.py configs/gsdiff_sd35m_80g.yaml gsdiff_gobj83k_sd35m__render \
+--prompt a_toy_robot --output_video_type gif \
+--gpu_id 0 --seed 0 [--half_precision]
+```
+You will get:
+| DiffSplat (SD1.5) | DiffSplat (PixArt-Sigma) | DiffSplat (SD3.5m) |
+|-------------------------|-------------------------------|-------------------------|
+| ![sd15_text](./assets/_demo/a_toy_robot/sd15.gif) | ![pas_text](./assets/_demo/a_toy_robot/pas.gif) | ![sd35m_text](./assets/_demo/a_toy_robot/sd35m.gif) |
+**More Advanced Arguments**:
+- `--prompt_file`: instead of using `--prompt`, `--prompt_file` will read prompts from a `.txt` file line by line.
+- Diffusion configurations:
+    - `--scheduler_type`: choose from `ddim`, `dpmsolver++`, `sde-dpmsolver++`, etc.
+    - `--num_inference_timesteps`: the number of diffusion steps.
+    - `--guidance_scale`: classifier-free guidance (CFG) scale; `1.0` means no CFG.
+    - `--eta`: specified for `DDIM` scheduler; the weight of the noise added in diffusion steps.
+- [Instant3D](https://instant-3d.github.io) tricks:
+    - `--init_std`, `--init_noise_strength`, `--init_bg`: initial noise settings, cf. [Instant3D Sec. 3.1](https://arxiv.org/pdf/2311.06214); NOT used by default, as we found it's not that helpful in our case.
+- Others:
+    - `--elevation`: elevation for viewing and rendering; not necessary for text-conditioned generation; set to `10` by default (from xz-plane (`0`) to +y axis (`90`)).
+    - `--negative_prompt`: empty prompt (`""`) by default; used with CFG for better visual quality (e.g., more vibrant colors), but we found it causes lower metric values (such as [ImageReward](https://github.com/THUDM/ImageReward)).
+    - `--save_ply`: save the generated 3DGS as a `.ply` file; used with `--opacity_threshold_ply` to filter out low-opacity splats for much smaller `.ply` file size.
+    - `--eval_text_cond`: evaluate text-conditioned generation automatically.
+    - ...
+Please refer to [infer_gsdiff_sd.py](./src/infer_gsdiff_sd.py), [infer_gsdiff_pas.py](./src/infer_gsdiff_pas.py), and [infer_gsdiff_sd3.py](./src/infer_gsdiff_sd3.py) for more argument details.
+#### 2. Image-conditioned 3D Object Generation
+Note that:
+- Most of the arguments are the same as text-conditioned generation. Our method supports **text and image as conditions simultaneously**.
+- Elevation is necessary for image-conditioned generation. You can specify the elevation angle by `--elevation` for viewing and rendering (from xz-plane (`0`) to +y axis (`90`)) or estimate it from the input image by `--use_elevest` (download the pretrained `ElevEst` model by `python3 download_ckpt.py --model_type elevest`) first. But we found that the **estimated elevation is not always accurate**, so it's better to set it manually.
+- Text prompt is **optional** for image-conditioned generation. If you want to use text prompt, you can specify it by `--prompt` (e.g., `a_frog`), otherwise, empty prompt (`""`) will be used. Note that **DiffSplat (SD3.5m)** is sensitive to text prompts, and it may generate bad results without a proper prompt.
+- Remember to set a smaller `--guidance_scale` for image-conditioned generation, as the default value is set for text-conditioned generation. `2.0` is recommended for most cases.
+- `--triangle_cfg_scaling` is a trick that sets larger CFG values for views far away from the input image and smaller CFG values for close-up views, cf. [SV3D Sec. 3](https://arxiv.org/pdf/2403.12008).
+- `--rembg_and_center` will remove the background and center the object in the image. It can be used with `--rembg_model_name` (by default `u2net`) and `--border_ratio` (by default `0.2`).
+- Image-conditioned generation is more sensitive to arguments, and you may need to tune them for better results.
+```bash
+# DiffSplat (SD1.5)
+bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml gsdiff_gobj83k_sd15_image__render \
+--rembg_and_center --triangle_cfg_scaling --output_video_type gif --guidance_scale 2 \
+--image_path assets/grm/frog.png --elevation 20 --prompt a_frog
+# DiffSplat (PixArt-Sigma)
+bash scripts/infer.sh src/infer_gsdiff_pas.py configs/gsdiff_pas.yaml gsdiff_gobj83k_pas_fp16_image__render \
+--rembg_and_center --triangle_cfg_scaling --output_video_type gif --guidance_scale 2 \
+--image_path assets/grm/frog.png --elevation 20 --prompt a_frog
+# DiffSplat (SD3.5m)
+bash scripts/infer.sh src/infer_gsdiff_sd3.py configs/gsdiff_sd35m_80g.yaml gsdiff_gobj83k_sd35m_image__render \
+--rembg_and_center --triangle_cfg_scaling --output_video_type gif --guidance_scale 2 \
+--image_path assets/grm/frog.png --elevation 20 --prompt a_frog
+```
+You will get:
+| Arguments | DiffSplat (SD1.5) | DiffSplat (PixArt-Sigma) | DiffSplat (SD3.5m) |
+|---------|-------------------------|-------------------------------|-------------------------|
+| `--elevation 20 --prompt a_frog` | ![sd15_image](./assets/_demo/a_frog/sd15.gif) | ![pas_image](./assets/_demo/a_frog/pas.gif) | ![sd35m_image](./assets/_demo/a_frog/sd35m.gif) |
+| `--use_elevest --prompt a_frog` (estimated elevation: -0.78 deg) | ![sd15_image](./assets/_demo/a_frog_elevest/sd15.gif) | ![pas_image](./assets/_demo/a_frog_elevest/pas.gif) | ![sd35m_image](./assets/_demo/a_frog_elevest/sd35m.gif) |
+| `--elevation 20` (prompt is `""`) | ![sd15_image](./assets/_demo/a_frog_empty/sd15.gif) | ![pas_image](./assets/_demo/a_frog_empty/pas.gif) | ![sd35m_image](./assets/_demo/a_frog_empty/sd35m.gif) |
+**More Advanced Arguments**:
+- `--image_dir`: instead of using `--image_path`, `--image_dir` will read images from a directory.
+Please refer to [infer_gsdiff_sd.py](./src/infer_gsdiff_sd.py), [infer_gsdiff_pas.py](./src/infer_gsdiff_pas.py), and [infer_gsdiff_sd3.py](./src/infer_gsdiff_sd3.py) for more argument details.
+#### 3. ControlNet for 3D Object Generation
+Note that:
+- After downloading pretrained **DiffSplat (SD1.5)**, you should download the controlnet weights by `python3 download_ckpt.py --model_type [depth | normal | canny]`.
+- For **depth-controlnet**, values in depth maps are normalized to `[0, 1]` and larger values (white) mean closer to the camera (smaller depth). Please refer to [GObjaverse Dataset](./src/data/gobjaverse_parquet_dataset.py) for more details.
+- For **normal-controlnet**, input camera is normalized to locate at `(0, 0, 1.4)` and look at `(0, 0, 0)`, thus the input normal maps are transformed accordingly. Please refer to [GObjaverse Dataset](./src/data/gobjaverse_parquet_dataset.py) for more details.
+- For **canny-controlnet**, canny edges are extracted from the input RGB images automatically by `cv2.Canny`. Please refer to [GObjaverse Dataset](./src/data/gobjaverse_parquet_dataset.py) for more details.
+```bash
+# ControlNet (depth)
+bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml gsdiff_gobj83k_sd15__render \
+--load_pretrained_controlnet gsdiff_gobj83k_sd15__render__depth \
+--output_video_type gif --image_path assets/diffsplat/controlnet/toy_depth.png \
+--prompt teddy_bear --elevation 10
+# ControlNet (normal)
+bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml gsdiff_gobj83k_sd15__render \
+--load_pretrained_controlnet gsdiff_gobj83k_sd15__render__normal \
+--output_video_type gif --image_path assets/diffsplat/controlnet/robot_normal.png \
+--prompt iron_robot --elevation 10
+# ControlNet (canny)
+bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml gsdiff_gobj83k_sd15__render \
+--load_pretrained_controlnet gsdiff_gobj83k_sd15__render__canny \
+--output_video_type gif --image_path assets/diffsplat/controlnet/cookie_canny.png \
+--prompt book --elevation 10
+```
+You will get:
+| Original Image | Input Control | `--prompt teddy_bear` | `--prompt panda` |
+|----------------|---------------|-----------------------|--------------------|
+| ![depth_image](./assets/diffsplat/controlnet/toy_image.png) | ![depth](./assets/diffsplat/controlnet/toy_depth.png) | ![controlnet_1](assets/_demo/controlnet/teddy_bear.gif) | ![controlnet_2](assets/_demo/controlnet/panda.gif) |
+| Original Image | Input Control | `--prompt iron_robot` | `--prompt plush_dog_toy` |
+|----------------|---------------|-----------------------|--------------------|
+| ![normal_image](./assets/diffsplat/controlnet/robot_image.png) | ![normal](./assets/diffsplat/controlnet/robot_normal.png) | ![controlnet_1](assets/_demo/controlnet/iron_robot.gif) | ![controlnet_2](assets/_demo/controlnet/plush_dog_toy.gif) |
+| Original Image | Input Control | `--prompt book` | `--prompt cookie` |
+|----------------|---------------|-----------------|---------------------|
+| ![canny_image](./assets/diffsplat/controlnet/cookie_image.png) | ![canny](./assets/diffsplat/controlnet/cookie_canny.png) | ![controlnet_1](assets/_demo/controlnet/book.gif) | ![controlnet_2](assets/_demo/controlnet/cookie.gif) |
+**More Advanced Arguments**:
+- `--guess_mode`: ControlNet encoder tries to recognize the content of the input image even if you remove all prompts, cf. [the original ControlNet repo](https://github.com/lllyasviel/ControlNet#guess-mode--non-prompt-mode) and [HF ControlNet](https://huggingface.co/docs/diffusers/using-diffusers/controlnet#guess-mode).
+- `--controlnet_scale`: determines how much weight to assign to the conditioning inputs; outputs of the ControlNet are multiplied by `controlnet_scale` before they are added to the residual in the original UNet.
+Please refer to [infer_gsdiff_sd.py](./src/infer_gsdiff_sd.py) for more argument details.
+### 🦾 Training
+#### 1. GSRecon
+Please refer to [train_gsrecon.py](./src/train_gsrecon.py).
+Instructions for `GSRecon` training will be provided soon.
+#### 2. GSVAE
+Please refer to [train_gsvae.py](./src/train_gsvae.py).
+Instructions for `GSVAE` training will be provided soon.
+#### 3. DiffSplat
+Please refer to [train_gsdiff_sd.py](./src/train_gsdiff_sd.py), [train_gsdiff_pas.py](./src/train_gsdiff_pas.py), and [train_gsdiff_sd3.py](./src/train_gsdiff_sd3.py).
+Instructions for `DiffSplat` training will be provided soon.
+#### 4. ControlNet
+Please refer to [train_gsdiff_sd_controlnet.py](./src/train_gsdiff_sd_controlnet.py).
+Instructions for `ControlNet` training and inference will be provided soon.
+## 😊 Acknowledgement
+We would like to thank the authors of [LGM](https://me.kiui.moe/lgm), [GRM](https://justimyhxu.github.io/projects/grm), and [Wonder3D](https://www.xxlong.site/Wonder3D) for their great work and for generously providing their source code, which inspired our work and helped us a lot in the implementation.
+## 📚 Citation
+If you find our work helpful, please consider citing:
+```bibtex
+@inproceedings{lin2025diffsplat,
+  title={DiffSplat: Repurposing Image Diffusion Models for Scalable 3D Gaussian Splat Generation},
+  author={Lin, Chenguo and Pan, Panwang and Yang, Bangbang and Li, Zeming and Mu, Yadong},
+  booktitle={International Conference on Learning Representations (ICLR)},
+  year={2025}
+}
+```

app.py ADDED Viewed

	@@ -0,0 +1,165 @@

+import os
+import shlex
+import subprocess
+import imageio
+import numpy as np
+import gradio as gr
+import spaces
+import sys
+from loguru import logger
+current_path = os.path.dirname(os.path.abspath(__file__))
+MAX_SEED = np.iinfo(np.int32).max
+TMP_DIR = os.path.join(current_path, 'out')
+os.makedirs(TMP_DIR, exist_ok=True)
+TAG = "gsdiff_gobj83k_sd15__render"
+# download checkpoints
+# subprocess.run(shlex.split("python3 download_ckpt.py --model_type pas")) # for txt condition
+# subprocess.run(shlex.split("python3 download_ckpt.py --model_type pas --image_cond")) # for img condition
+# img_commands = "PYTHONPATH=./ bash scripts/infer.sh src/infer_gsdiff_pas.py configs/gsdiff_pas.yaml {} \
+# --rembg_and_center --triangle_cfg_scaling --save_ply --output_video_type mp4 --guidance_scale {} \
+# --image_path {} --elevation {} --prompt {} --seed {}"
+# txt_commands = "PYTHONPATH=./ bash scripts/infer.sh src/infer_gsdiff_pas.py configs/gsdiff_pas.yaml \
+# --rembg_and_center --triangle_cfg_scaling --save_ply --output_video_type mp4 --guidance_scale {} \
+# --image_path {} --elevation {} --prompt {} --seed {}"
+# SD1.5
+subprocess.run(shlex.split("python3 download_ckpt.py --model_type sd15")) # for txt condition
+# subprocess.run(shlex.split("python3 download_ckpt.py --model_type sd15 --image_cond")) # for img condition
+img_commands = "PYTHONPATH=./ bash scripts/infer.sh src/infer_gsdiff_sd.py configs/gsdiff_sd15.yaml  \
+--rembg_and_center --triangle_cfg_scaling --save_ply --output_video_type mp4 --guidance_scale {} \
+--image_path {} --elevation {} --prompt {} --seed {}"
+txt_commands = "PYTHONPATH=./ bash scripts/infer.sh src/infer_gsdiff_sd.py  configs/gsdiff_sd15.yaml {} \
+--rembg_and_center --save_ply --output_video_type mp4 --guidance_scale {} \
+ --elevation {} --prompt {} --seed {}"
+# process function
+@spaces.GPU
+def process(input_image, prompt='a_high_quality_3D_asset', prompt_neg='ugly, blurry, pixelated obscure, unnatural colors, poor lighting, dull, unclear, cropped, lowres, low quality, artifacts, duplicate', input_elevation=20, guidance_scale=2., input_seed=0):
+    if input_image is not None:
+        image_path = os.path.join(TMP_DIR, "input_image.png")
+        image_name = image_path.split('/')[-1].split('.')[0]
+        input_image.save(image_path)
+        full_command = img_commands.format(TAG, guidance_scale, image_path, input_elevation, prompt, input_seed)
+    else:
+        full_command = txt_commands.format(TAG, guidance_scale, input_elevation, prompt, input_seed)
+        image_name = ""
+    os.system(full_command)
+    # save video and ply files
+    ckpt_dir = os.path.join(TMP_DIR, TAG, "checkpoints")
+    infer_from_iter = int(sorted(os.listdir(ckpt_dir))[-1])
+    MAX_NAME_LEN = 20  # TODO: make `20` configurable
+    prompt = prompt.replace("_", " ")
+    prompt_name = prompt[:MAX_NAME_LEN] + "..." if prompt[:MAX_NAME_LEN] != "" else prompt
+    name = f"[{image_name}]_[{prompt_name}]_{infer_from_iter:06d}"
+    output_video_path = os.path.join(TMP_DIR, TAG, "inference",  name + ".mp4")
+    output_ply_path = os.path.join(TMP_DIR, TAG, "inference",  name + ".ply")
+    output_img_path = os.path.join(TMP_DIR, TAG, "inference",  name + "_gs.png")
+    logger.info(full_command, output_video_path, output_ply_path)
+    output_image = imageio.imread(output_img_path)
+    return output_image, output_video_path, output_ply_path
+# gradio UI
+_TITLE = '''DiffSplat: Repurposing Image Diffusion Models for Scalable Gaussian Splat Generation'''
+_DESCRIPTION = '''
+### If you find our work helpful, please consider citing our paper 📚 or giving the repo a star 🌟
+<div>
+<a style="display:inline-block; margin-left: .5em" href="https://chenguolin.github.io/projects/DiffSplat"><img src='https://img.shields.io/badge/Project-Page-brightgreen'/></a>
+<a style="display:inline-block; margin-left: .5em" href="https://arxiv.org/abs/2501.16764"><img src='https://img.shields.io/badge/arXiv-2501.16764-b31b1b.svg?logo=arXiv'/></a>
+<a style="display:inline-block; margin-left: .5em" href="https://github.com/chenguolin/DiffSplat"><img src='https://img.shields.io/github/stars/chenguolin/DiffSplat?style=social'/></a>
+<a style="display:inline-block; margin-left: .5em" href="https://huggingface.co/chenguolin/DiffSplat"><img src='https://img.shields.io/badge/HF-Model-yellow'/></a>
+</div>
+* Input can be only text, only image, or both image and text.
+* If you find the generated 3D asset satisfactory, click "Extract GLB" to extract the GLB file and download it.
+* Upload an image and click "Generate" to create a 3D asset. If the image has alpha channel, it be used as the mask. Otherwise, we use `rembg` to remove the background.
+'''
+# Build the Gradio interface: a title row, the description, then a panel row with
+# one column of input controls and one column of outputs, followed by two example
+# galleries.
+block = gr.Blocks(title=_TITLE).queue()
+with block:
+    with gr.Row():
+        with gr.Column(scale=1):
+            gr.Markdown('# ' + _TITLE)
+    gr.Markdown(_DESCRIPTION)
+    with gr.Row(variant='panel'):
+        with gr.Column(scale=1):
+            # input image
+            input_image = gr.Image(label="image", type='pil')
+            # input prompt
+            input_text = gr.Textbox(label="prompt",value="a_high_quality_3D_asset")
+            # negative prompt
+            # (starts empty, so the UI overrides the default negative prompt of `process`)
+            input_neg_text = gr.Textbox(label="negative prompt", value="")
+            # guidance_scale
+            guidance_scale = gr.Slider(label="guidance scale", minimum=1., maximum=7.5, step=0.5, value=2.0)
+            # elevation
+            input_elevation = gr.Slider(label="elevation", minimum=-90, maximum=90, step=1, value=20)
+            # # inference steps
+            # input_num_steps = gr.Slider(label="inference steps", minimum=1, maximum=100, step=1, value=30)
+            # random seed
+            input_seed = gr.Slider(label="random seed", minimum=0, maximum=100000, step=1, value=0)
+            # gen button
+            button_gen = gr.Button("Generate")
+        with gr.Column(scale=1):
+            with gr.Tab("Video"):
+                # final video results
+                output_video = gr.Video(label="video")
+                # ply file
+                output_file = gr.File(label="3D Gaussians (ply format)")
+            with gr.Tab("Splatter Images"):
+                output_image = gr.Image(interactive=False, show_label=False)
+        # Wire the button to `process`; the inputs are listed in the order of its
+        # positional parameters (image, prompt, negative prompt, elevation,
+        # guidance scale, seed) and the outputs in the order of its return tuple.
+        button_gen.click(process, inputs=[input_image, input_text, input_neg_text, input_elevation, guidance_scale, input_seed], outputs=[output_image, output_video, output_file])
+    # Image examples: every .png directly inside assets/diffsplat, resolved relative
+    # to the current working directory. Clicking one runs `process` with only the
+    # image set; all other arguments use the defaults of `process`.
+    gr.Examples(
+        examples=[
+                f'assets/diffsplat/{image}'
+                for image in os.listdir("assets/diffsplat") if image.endswith('.png')
+        ],
+        inputs=[input_image],
+        outputs=[output_image, output_video, output_file],
+        fn=lambda x: process(input_image=x),
+        # cache_examples=True,
+        run_on_click=True,
+        label='Image-to-3D Examples'
+    )
+    # Text examples: clicking one runs `process` with no image and the example
+    # string as the prompt.
+    gr.Examples(
+        examples=[
+            "a_toy_robot",
+            "a_cute_panda",
+            "a_book"
+        ],
+        inputs=[input_text],
+        outputs=[output_image, output_video, output_file],
+        fn=lambda x: process(input_image=None, prompt=x),
+        # cache_examples=True,
+        run_on_click=True,
+        label='Text-to-3D Examples'
+    )
+# Launch the Gradio app
+if __name__ == "__main__":
+    block.launch(share=True)

assets/_demo/1.gif ADDED Viewed

Git LFS Details

SHA256: e5026f63c1c69ba4d31c34cc82ccef0ac75c24b947893376a4f227ff04fc00dc
Pointer size: 132 Bytes
Size of remote file: 1.87 MB

assets/_demo/10.gif ADDED Viewed

Git LFS Details

SHA256: e6d6191e04b32f0b74a299bb3cf35735fa329bec309165056128405e5a1e55ef
Pointer size: 132 Bytes
Size of remote file: 1.76 MB

assets/_demo/2.gif ADDED Viewed

Git LFS Details

SHA256: f63f122c00335401c849c73e0bb71c12785d1754f506acb32c5fe324404cefd7
Pointer size: 132 Bytes
Size of remote file: 4.61 MB

assets/_demo/3.gif ADDED Viewed

Git LFS Details

SHA256: acf87ce7deebc7693fd6c72e25fc22deb3642b0cf5ff732a68bd330f3b5472af
Pointer size: 132 Bytes
Size of remote file: 4.96 MB

assets/_demo/4.gif ADDED Viewed

Git LFS Details

SHA256: 2f88df29b6f2e06006df95d61a4be87d4c3774da455526b255dc7aacd4ec7ef6
Pointer size: 132 Bytes
Size of remote file: 3.22 MB

assets/_demo/5.gif ADDED Viewed

Git LFS Details

SHA256: 006f05b05d3630b7ebfe0cf067de203d55fa778472d7d038cbf87363e40c70a9
Pointer size: 132 Bytes
Size of remote file: 4.12 MB

assets/_demo/6.gif ADDED Viewed

Git LFS Details

SHA256: c16ba28c12d40ea83d0cc705af89659c2e671bc93c254c49583d1d0fbca2ea56
Pointer size: 132 Bytes
Size of remote file: 1.97 MB

assets/_demo/7.gif ADDED Viewed

Git LFS Details

SHA256: 79a27742114d96e0e767d8e722e70ea5f83b06e8fc44b3e782c2b7ce2f64a4bb
Pointer size: 132 Bytes
Size of remote file: 1.81 MB

assets/_demo/8.gif ADDED Viewed

Git LFS Details

SHA256: 8a99d281c8bc17a8c4655585cf4dbc1da51e3490229e55294582d35f26fba7a1
Pointer size: 132 Bytes
Size of remote file: 2.64 MB

assets/_demo/9.gif ADDED Viewed

Git LFS Details

SHA256: aff03087a11381171ce700dffb0ffc194ff009ba36a486de01de8f2bb04f3069
Pointer size: 132 Bytes
Size of remote file: 3.31 MB

assets/_demo/a_frog/pas.gif ADDED Viewed

Git LFS Details

SHA256: 078c2374d80b8e3ecfdb0e54b024237708e06b6035ef750e16d05c39b97f4998
Pointer size: 132 Bytes
Size of remote file: 3.57 MB

assets/_demo/a_frog/sd15.gif ADDED Viewed

Git LFS Details

SHA256: cf8db71ca8962c9337fceabed510081ee5be63029c5194ec936e0809ef9c0814
Pointer size: 132 Bytes
Size of remote file: 3.53 MB

assets/_demo/a_frog/sd35m.gif ADDED Viewed

Git LFS Details

SHA256: ccbd8ced948c77606826e9baad190c82a97312cad3f73d875213c74480bba167
Pointer size: 132 Bytes
Size of remote file: 4.06 MB

assets/_demo/a_frog_elevest/pas.gif ADDED Viewed

Git LFS Details

SHA256: 2ba7e65d04231c4a686c2545925eb185e662633f99d8e62f46e4787f00a84cde
Pointer size: 132 Bytes
Size of remote file: 3.55 MB

assets/_demo/a_frog_elevest/sd15.gif ADDED Viewed

Git LFS Details

SHA256: a6054d11ee74288eee98bde90db223a40c79fa158f64b7cc6f27dac37d74dfbf
Pointer size: 132 Bytes
Size of remote file: 3.38 MB

assets/_demo/a_frog_elevest/sd35m.gif ADDED Viewed

Git LFS Details

SHA256: a167109dfd1c1cd46f14648b3845d23b8d7f49e0cdaf089f78b356ff3300b34f
Pointer size: 132 Bytes
Size of remote file: 3.73 MB

assets/_demo/a_frog_empty/pas.gif ADDED Viewed

Git LFS Details

SHA256: 18443bb88dcab653c41b2dcddfa8423d735fac1adf664cc374d45ef5ed9e5d53
Pointer size: 132 Bytes
Size of remote file: 3.49 MB

assets/_demo/a_frog_empty/sd15.gif ADDED Viewed

Git LFS Details

SHA256: b0b550b17d9dc85af20324ad7bb310a37599f3d6502fc9969fda1d29897dacf9
Pointer size: 132 Bytes
Size of remote file: 3.43 MB

assets/_demo/a_frog_empty/sd35m.gif ADDED Viewed

Git LFS Details

SHA256: c8ad473274b2cd9b2c7d4f7368a0bed22685ac8ca823e0984c7ca993c2b6898c
Pointer size: 132 Bytes
Size of remote file: 3.55 MB

assets/_demo/a_toy_robot/pas.gif ADDED Viewed

Git LFS Details

SHA256: 68d9b2d11a8129c5e1567664ab40d48da8123e283638bb2b5813d3461284b247
Pointer size: 132 Bytes
Size of remote file: 2.02 MB

assets/_demo/a_toy_robot/sd15.gif ADDED Viewed

Git LFS Details

SHA256: c213115602ac16f60cb3e877d5bfb57111ff1b7cfc2f47f3c188a096a421a658
Pointer size: 132 Bytes
Size of remote file: 2.14 MB

assets/_demo/a_toy_robot/sd35m.gif ADDED Viewed

Git LFS Details

SHA256: 850dab4e311c96d23db7c4c2fe9b15598c695512a29b5643e7dcad220845bd9f
Pointer size: 132 Bytes
Size of remote file: 2.11 MB

assets/_demo/controlnet/book.gif ADDED Viewed

Git LFS Details

SHA256: 8d138dcba04ea3079a21b083416146a292a2b0f300bf3403aeb4c43918e29272
Pointer size: 132 Bytes
Size of remote file: 2.23 MB

assets/_demo/controlnet/cookie.gif ADDED Viewed

Git LFS Details

SHA256: 0d842886ed5e13d2d03ded8d877cc6c25fbb09681fbcc1884e240a09e8cdbfd4
Pointer size: 132 Bytes
Size of remote file: 2.01 MB

assets/_demo/controlnet/iron_robot.gif ADDED Viewed

Git LFS Details

SHA256: c7d16871a73b989c0632dd722ab7134738ebf4d42e8953cec0dcc3eddc27d9c2
Pointer size: 132 Bytes
Size of remote file: 2.76 MB

assets/_demo/controlnet/panda.gif ADDED Viewed

Git LFS Details

SHA256: b7e53a7407d05617033fd9b7b90ff1e75c9e17983d60abd00499f48c0bc67ec4
Pointer size: 132 Bytes
Size of remote file: 2.77 MB

assets/_demo/controlnet/plush_dog_toy.gif ADDED Viewed

Git LFS Details

SHA256: 6c1e7731f8400beacf065db130f721789593f4c67a57473f5c5a1c935fa5c00a
Pointer size: 132 Bytes
Size of remote file: 3.18 MB

assets/_demo/controlnet/teddy_bear.gif ADDED Viewed

Git LFS Details

SHA256: 32941570f92e60addec09091c0cac24ab28f85ceb2d732aa8f8e0bcb4a774493
Pointer size: 132 Bytes
Size of remote file: 3.12 MB

assets/_demo/overview.png ADDED Viewed

Git LFS Details

SHA256: f09b1aadf070bed1c9e4ca503b09c2ee0d6790951b4718f97ff2a24d4c3281dd
Pointer size: 131 Bytes
Size of remote file: 236 kB

assets/crm/3D/345/215/241/351/200/232/347/213/227.webp ADDED Viewed

assets/crm/astronaut.webp ADDED Viewed

Git LFS Details

SHA256: c3e9157b31885c0fbccdba965f8ad1e27b51c41fbdb609ee8fc5728e6f4e4c3d
Pointer size: 131 Bytes
Size of remote file: 101 kB

assets/crm/bulldog.webp ADDED Viewed

assets/crm/ghost-eating-burger.webp ADDED Viewed

assets/crm/kunkun.webp ADDED Viewed

assets/crm//344/270/207/345/234/243/345/215/227/347/223/234.webp ADDED Viewed

assets/crm//344/272/272/347/211/251/351/252/221/351/251/254.webp ADDED Viewed

assets/crm//345/210/235/351/237/263/346/234/252/346/235/245/347/216/251/345/201/266.webp ADDED Viewed

assets/crm//345/215/241/351/200/232/346/201/220/351/276/231.webp ADDED Viewed

assets/crm//345/215/241/351/200/232/346/211/213/346/236/252/346/210/252/345/233/276.webp ADDED Viewed

assets/crm//345/215/241/351/200/232/347/214/253.webp ADDED Viewed

assets/crm//345/215/241/351/200/232/350/230/221/350/217/207/345/245/227/350/243/205.webp ADDED Viewed

assets/crm//345/217/257/347/210/261/347/216/204/347/255/226.webp ADDED Viewed

assets/crm/大头泡泡马特.webp ADDED Viewed

Git LFS Details

SHA256: 7135922c38ef118eace0abe2a7fbf78574ebebcf973aeb8cf67ed6cfdde1fcdd
Pointer size: 131 Bytes
Size of remote file: 354 kB

assets/crm//345/275/251/350/211/262/350/230/221/350/217/207.webp ADDED Viewed

assets/crm//345/275/251/350/211/262/350/230/221/350/217/2072.webp ADDED Viewed