Spaces:

sitatech
/

vibe-shopping

Running

App Files Files Community

vibe-shopping / mcp_server.py

sitatech

Fix Vitual try app name on modal

b410cdf 6 months ago

raw

history blame

5.27 kB

	import requests
	import base64

	from mcp.server.fastmcp import FastMCP
	from mcp.types import ImageContent
	import modal

	# MCP server instance; the tool functions in this file register on it via @mcp.tool().
	mcp = FastMCP("Virtual Try MCP Server")
	# Cached VirtualTryModel handle. Stays None until virtual_try_model() is first called.
	_virtual_try_model = None


	def virtual_try_model():
	    """Return the shared VirtualTryModel handle, building it on first use.

	    The Modal class is looked up and instantiated lazily, from inside the
	    tool call, so that initialisation errors bubble up to the tool (and
	    hence to the MCP client) instead of failing silently while the server
	    is being created.
	    """
	    global _virtual_try_model

	    # Fast path: an earlier call already built the handle.
	    if _virtual_try_model is not None:
	        return _virtual_try_model

	    model_cls = modal.Cls.from_name(
	        "vibe-shopping-virtual-try",
	        "VirtualTryModel",
	        environment_name="vibe-shopping",
	    )
	    _virtual_try_model = model_cls()
	    return _virtual_try_model


	def bytes_to_image(result_image_bytes: bytes, format: str = "webp") -> ImageContent:
	    """Wrap raw image bytes in an MCP ``ImageContent`` payload.

	    Args:
	        result_image_bytes: The encoded image data.
	        format: Image subtype used to build the MIME type ``image/<format>``.

	    Returns:
	        An ``ImageContent`` of type ``"image"`` whose ``data`` is the base64
	        text of ``result_image_bytes``.
	    """
	    encoded = base64.b64encode(result_image_bytes)
	    mime_type = f"image/{format}"
	    return ImageContent(
	        type="image",
	        data=encoded.decode("utf-8"),
	        mimeType=mime_type,
	    )


	@mcp.tool()
	def try_item_with_masking(
	    prompt: str,
	    item_image_url: str,
	    target_image_url: str,
	    mask_image_url: str,
	) -> "ImageContent":
	    """
	    Try an item on a target image by inpainting (with a diffusion model) the item onto the target image using a provided mask.

	    For example, if the item is a purple skirt, the target image is a woman standing, you could use this prompt:
	    The pair of images highlights a skirt and its fit on a woman, high resolution, 4K, 8K;
	    [IMAGE1] Detailed product shot of a purple skirt
	    [IMAGE2] The same skirt is worn by a woman standing in a realistic lifestyle setting, the skirt fits naturally.

	    Args:
	        prompt: A prompt for the diffusion model to use for inpainting. Be specific, e.g: for a short dress, say short dress, not just dress.
	        item_image_url: URL of the item image to try.
	        target_image_url: URL of the target image where the item will be tried.
	        mask_image_url: URL of the mask image to use for inpainting.

	    Returns:
	        The image where the item is applied to the target image.

	    Raises:
	        requests.RequestException: If any of the images cannot be downloaded (connection error, timeout or HTTP error status).
	    """
	    # Download every input before calling the model. The timeout keeps a
	    # stalled host from hanging the tool call forever, and raise_for_status()
	    # stops an HTTP error page from being passed on as if it were image data.
	    downloaded = []
	    for url in (item_image_url, target_image_url, mask_image_url):
	        response = requests.get(url, timeout=30)
	        response.raise_for_status()
	        downloaded.append(response.content)
	    item_image_bytes, target_image_bytes, mask_image_bytes = downloaded

	    result_image_bytes: bytes = virtual_try_model().try_it.remote(
	        prompt=prompt,
	        image_bytes=target_image_bytes,
	        item_to_try_bytes=item_image_bytes,
	        mask_bytes=mask_image_bytes,
	    )

	    # The virtual try model returns a webp image.
	    return bytes_to_image(result_image_bytes, format="webp")


	@mcp.tool()
	def try_item_with_auto_masking(
	    prompt: str,
	    item_image_url: str,
	    target_image_url: str,
	    masking_prompt: str,
	) -> "ImageContent":
	    """
	    Try an item on a target image by inpainting the item onto the target image using an auto-generated mask based on the masking_prompt.
	    For example, if the item is a sofa and the target image is a living room containing a yellow sofa, the masking prompt could be "yellow sofa" and the prompt could be:
	    The pair of images highlights a yellow sofa and how it fits in a living room, high resolution, 4K, 8K;
	    [IMAGE1] Detailed product shot of a yellow sofa
	    [IMAGE2] The same sofa is shown in a living room in a realistic lifestyle setting, the sofa fits in naturally with the room decor.

	    For cases where a similar item is present but masking it won't cover enough area for the item to be applied, if you can, you should use a composite mask prompt.
	    For example if the item is a long-sleeved shirt and the target image is a person wearing a short-sleeved t-shirt, the masking prompt could be "t-shirt, arms, neck".
	    If the item is a dress and the target image is a person wearing a t-shirt and jeans, the masking prompt could be "t-shirt, jeans, arms, legs".
	    Make sure the mask prompt includes all the parts where the item will be applied to.

	    This tool requires a similar item to be present in the target image, so it can generate a mask of the item using the masking_prompt.

	    Args:
	        prompt: A prompt for the diffusion model to use for inpainting. Be specific, e.g: for a long-sleeved shirt, say long-sleeved shirt, not just shirt.
	        item_image_url: URL of the item image to try.
	        target_image_url: URL of the target image where the item will be tried.
	        masking_prompt: Prompt for generating a mask of the corresponding item in the target image. It needs to be short and descriptive, e.g. "red dress", "blue sofa", "tire", "skirt, legs" etc.

	    Returns:
	        The image where the item is applied to the target image.

	    Raises:
	        requests.RequestException: If either image cannot be downloaded (connection error, timeout or HTTP error status).
	    """
	    # Download both inputs before calling the model. The timeout keeps a
	    # stalled host from hanging the tool call forever, and raise_for_status()
	    # stops an HTTP error page from being passed on as if it were image data.
	    downloaded = []
	    for url in (item_image_url, target_image_url):
	        response = requests.get(url, timeout=30)
	        response.raise_for_status()
	        downloaded.append(response.content)
	    item_image_bytes, target_image_bytes = downloaded

	    virtual_try = virtual_try_model()

	    result_image_bytes: bytes = virtual_try.try_it.remote(
	        prompt=prompt,
	        image_bytes=target_image_bytes,
	        item_to_try_bytes=item_image_bytes,
	        masking_prompt=masking_prompt,
	    )

	    # The virtual try model returns a webp image.
	    return bytes_to_image(result_image_bytes, format="webp")


	if __name__ == "__main__":
	    # Executed as a script (not imported): start the MCP server.
	    mcp.run()