# Copyright 2023-2025 Marigold Team, ETH Zürich. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# --------------------------------------------------------------------------
# More information about Marigold:
#   https://marigoldmonodepth.github.io
#   https://marigoldcomputervision.github.io
# Efficient inference pipelines are now part of diffusers:
#   https://huggingface.co/docs/diffusers/using-diffusers/marigold_usage
#   https://huggingface.co/docs/diffusers/api/pipelines/marigold
# Examples of trained models and live demos:
#   https://huggingface.co/prs-eth
# Related projects:
#   https://marigolddepthcompletion.github.io/
#   https://rollingdepth.github.io/
# Citation (BibTeX):
#   https://github.com/prs-eth/Marigold#-citation
#   https://github.com/prs-eth/Marigold-DC#-citation
#   https://github.com/prs-eth/rollingdepth#-citation
# --------------------------------------------------------------------------
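# For reference, a minimal standalone usage sketch (kept as comments, not executed),
# assuming the diffusers API linked above; the input image path is illustrative:
#   import torch
#   from diffusers import MarigoldIntrinsicsPipeline
#   from diffusers.utils import load_image
#   pipe = MarigoldIntrinsicsPipeline.from_pretrained(
#       "prs-eth/marigold-iid-appearance-v1-1", torch_dtype=torch.bfloat16
#   ).to("cuda")
#   out = pipe(load_image("example.jpg"))
#   vis = pipe.image_processor.visualize_intrinsics(out.prediction, pipe.target_properties)
#   vis[0]["albedo"].save("albedo.png")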
import os

os.system("pip freeze")  # log installed packages (visible in the Space logs)

import spaces  # noqa: F401  # ZeroGPU support on Hugging Face Spaces
import gradio as gr
import torch
from diffusers import MarigoldIntrinsicsPipeline, DDIMScheduler
from gradio_dualvision import DualVisionApp
from huggingface_hub import login
from PIL import Image

CHECKPOINT_APPEARANCE = "prs-eth/marigold-iid-appearance-v1-1"
CHECKPOINT_LIGHTING = "prs-eth/marigold-iid-lighting-v1-1"

if "HF_TOKEN_LOGIN" in os.environ:
    login(token=os.environ["HF_TOKEN_LOGIN"])

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32

pipe_appearance = MarigoldIntrinsicsPipeline.from_pretrained(CHECKPOINT_APPEARANCE)
pipe_appearance.scheduler = DDIMScheduler.from_config(pipe_appearance.scheduler.config, timestep_spacing="trailing")
pipe_appearance = pipe_appearance.to(device=device, dtype=dtype)

pipe_lighting = MarigoldIntrinsicsPipeline.from_pretrained(CHECKPOINT_LIGHTING)
pipe_lighting.scheduler = DDIMScheduler.from_config(pipe_lighting.scheduler.config, timestep_spacing="trailing")
pipe_lighting = pipe_lighting.to(device=device, dtype=dtype)
try:
    import xformers  # noqa: F401  # optional dependency for memory-efficient attention

    pipe_appearance.enable_xformers_memory_efficient_attention()
    pipe_lighting.enable_xformers_memory_efficient_attention()
except Exception:
    pass  # xformers is optional; fall back to the default attention implementation


class MarigoldIIDApp(DualVisionApp):
    DEFAULT_SEED = 2024
    DEFAULT_ENSEMBLE_SIZE = 1
    DEFAULT_DENOISE_STEPS = 4
    DEFAULT_PROCESSING_RES = 768

    def make_header(self):
        gr.Markdown(
            """
            <h2><a href="https://huggingface.co/spaces/prs-eth/marigold-intrinsics" style="color: black;">Marigold Intrinsic Image Decomposition</a></h2>
            """
        )
        with gr.Row(elem_classes="remove-elements"):
            gr.Markdown(
                f"""
                <p align="center">
                <a title="Website" href="https://marigoldcomputervision.github.io/" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/badge/%E2%99%A5%20Project%20-Website-blue">
                </a>
                <a title="diffusers" href="https://huggingface.co/docs/diffusers/using-diffusers/marigold_usage" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/badge/%F0%9F%A7%A8%20Read_diffusers-Tutorial-yellow?labelColor=green">
                </a>
                <a title="arXiv" href="https://arxiv.org/abs/2505.09358" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/badge/%F0%9F%93%84%20Read%20-Paper-AF3436">
                </a>
                <a title="Github" href="https://github.com/prs-eth/marigold" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/github/stars/prs-eth/marigold?label=GitHub%20%E2%98%85&logo=github&color=C8C" alt="badge-github-stars">
                </a>
                <a title="Image Depth" href="https://huggingface.co/spaces/prs-eth/marigold" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/badge/%F0%9F%A4%97%20Image%20Depth%20-Demo-yellow" alt="imagedepth">
                </a>
                <a title="Image Normals" href="https://huggingface.co/spaces/prs-eth/marigold-normals" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://img.shields.io/badge/%F0%9F%A4%97%20Image%20Normals%20-Demo-yellow" alt="imagenormals">
                </a>
                <a title="Social" href="https://twitter.com/antonobukhov1" target="_blank" rel="noopener noreferrer" style="display: inline-block;">
                    <img src="https://shields.io/twitter/follow/:?label=Subscribe%20for%20updates!" alt="social">
                </a>
                </p>
                <p align="center" style="margin-top: 0px;">
                    Upload a photo or select an example below to compute the intrinsic image decomposition in real time.
                    Use the slider to reveal areas of interest.
                    Use the radio buttons to switch between modalities.
                    Check out our other demos via the badges above.
                </p>
                """
            )
    def build_user_components(self):
        with gr.Column():
            ensemble_size = gr.Slider(
                label="Ensemble size",
                minimum=1,
                maximum=10,
                step=1,
                value=self.DEFAULT_ENSEMBLE_SIZE,
            )
            denoise_steps = gr.Slider(
                label="Number of denoising steps",
                minimum=1,
                maximum=20,
                step=1,
                value=self.DEFAULT_DENOISE_STEPS,
            )
            processing_res = gr.Radio(
                [
                    ("Native", 0),
                    ("Recommended", 768),
                ],
                label="Processing resolution",
                value=self.DEFAULT_PROCESSING_RES,
            )
        return {
            "ensemble_size": ensemble_size,
            "denoise_steps": denoise_steps,
            "processing_res": processing_res,
        }
    def process(self, image_in: Image.Image, **kwargs):
        ensemble_size = kwargs.get("ensemble_size", self.DEFAULT_ENSEMBLE_SIZE)
        denoise_steps = kwargs.get("denoise_steps", self.DEFAULT_DENOISE_STEPS)
        processing_res = kwargs.get("processing_res", self.DEFAULT_PROCESSING_RES)
        generator = torch.Generator(device=device).manual_seed(self.DEFAULT_SEED)

        # Appearance model: albedo, material, roughness, metallicity
        pipe_out_appearance = pipe_appearance(
            image_in,
            ensemble_size=ensemble_size,
            num_inference_steps=denoise_steps,
            processing_resolution=processing_res,
            batch_size=1 if processing_res == 0 else 2,
            output_uncertainty=ensemble_size >= 3,
            generator=generator,
        )
        iid_appearance_vis = pipe_appearance.image_processor.visualize_intrinsics(
            pipe_out_appearance.prediction, pipe_appearance.target_properties
        )

        # Lighting model (HyperSim-style decomposition): albedo, shading, residual
        pipe_out_lighting = pipe_lighting(
            image_in,
            ensemble_size=ensemble_size,
            num_inference_steps=denoise_steps,
            processing_resolution=processing_res,
            batch_size=1 if processing_res == 0 else 2,
            output_uncertainty=ensemble_size >= 3,
            generator=generator,
        )
        iid_lighting_vis = pipe_lighting.image_processor.visualize_intrinsics(
            pipe_out_lighting.prediction, pipe_lighting.target_properties
        )

        out_modalities = {
            "Albedo": iid_appearance_vis[0]["albedo"],
            "Materials": iid_appearance_vis[0]["material"],
            "Roughness": iid_appearance_vis[0]["roughness"],
            "Metallicity": iid_appearance_vis[0]["metallicity"],
            "Albedo (HyperSim)": iid_lighting_vis[0]["albedo"],
            "Shading (HyperSim)": iid_lighting_vis[0]["shading"],
            "Residual (HyperSim)": iid_lighting_vis[0]["residual"],
        }
        # Additionally, uncertainty can be computed on any of the output modalities; we skip it to keep the demo light.
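        # A minimal sketch of how that could look (kept as comments, untested), assuming the
        # diffusers Marigold image processor exposes `visualize_uncertainty` and that the
        # pipeline output carries an `uncertainty` field when output_uncertainty=True:
        #   if pipe_out_appearance.uncertainty is not None:
        #       unc_vis = pipe_appearance.image_processor.visualize_uncertainty(
        #           pipe_out_appearance.uncertainty
        #       )
        #       out_modalities["Uncertainty (Appearance)"] = unc_vis[0]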
        out_settings = {
            "ensemble_size": ensemble_size,
            "denoise_steps": denoise_steps,
            "processing_res": processing_res,
        }
        return out_modalities, out_settings


with MarigoldIIDApp(
    title="Marigold Intrinsic Image Decomposition",
    examples_path="files/image",
    examples_per_page=12,
    left_selector_visible=True,
    squeeze_canvas=True,
    spaces_zero_gpu_enabled=True,
) as demo:
    demo.queue(
        api_open=False,
    ).launch(
        server_name="0.0.0.0",
        server_port=7860,
    )