mart9992
/

vierundvi

Inference Endpoints

Model card Files Files and versions Community

vierundvi / test.py

mart9992's picture

m

8fc5cce 10 months ago

3.02 kB

	import os
	import subprocess
	import torch
	import requests
	from PIL import Image
	from io import BytesIO
	import subprocess
	import sys

	if False:
	def pip_command(command):
	subprocess.check_call([sys.executable, "-m", "pip"] + command.split())

	is_production = False

	os.chdir("/repository" if is_production else ".")
	os.environ['AM_I_DOCKER'] = 'False'
	os.environ['BUILD_WITH_CUDA'] = 'True'
	os.environ['CUDA_HOME'] = '/usr/local/cuda-11.7/' if is_production else '/usr/local/cuda-12.1/'

	pip_command("install -e segment_anything")

	pip_command("install -e GroundingDINO")

	response = requests.get("https://huggingface.co/Uminosachi/sam-hq/resolve/main/sam_hq_vit_h.pth")
	with open('./sam_hq_vit_h.pth', 'wb') as file:
	file.write(response.content)

	pip_command("install --upgrade diffusers[torch]")

	subprocess.run(["git", "submodule", "update", "--init", "--recursive"])
	subprocess.run(["bash", "grounded-sam-osx/install.sh"], cwd="grounded-sam-osx")

	subprocess.run(["git", "clone", "https://github.com/xinyu1205/recognize-anything.git"])

	pip_command("install -r ./recognize-anything/requirements.txt")

	pip_command("install -e ./recognize-anything/")

	from grounded_sam_demo import grounded_sam_demo
	import numpy as np
	from PIL import Image
	from scipy.ndimage import convolve
	from scipy.ndimage import binary_dilation


	def get_sd_mask(color_mask_pil, target=(72, 4, 84), tolerance=50):
	image_array = np.array(color_mask_pil)

	# Update target based on the number of color channels in the image array
	target = np.array(list(target) + [255] *
	(image_array.shape[-1] - len(target)))

	mask = np.abs(image_array - target) <= tolerance
	mask = np.all(mask, axis=-1)

	new_image_array = np.ones_like(image_array) * 255 # Start with white
	# Apply black where condition met
	new_image_array[mask] = [0] * image_array.shape[-1]

	return Image.fromarray(new_image_array)


	def expand_white_pixels(input_pil, expand_by=1):
	img_array = np.array(input_pil)
	is_white = np.all(img_array == 255, axis=-1)

	kernel = np.ones((2expand_by+1, 2expand_by+1), bool)
	expanded_white = binary_dilation(is_white, structure=kernel)

	expanded_array = np.where(expanded_white[..., None], 255, img_array)

	expanded_pil = Image.fromarray(expanded_array.astype('uint8'))
	return expanded_pil


	config_file = "GroundingDINO/groundingdino/config/GroundingDINO_SwinT_OGC.py"
	grounded_checkpoint = "groundingdino_swint_ogc.pth"
	sam_checkpoint = "sam_hq_vit_h.pth"


	def just_get_sd_mask(input_pil, text_prompt, padding):
	print("Doing sam")

	colored_mask_pil = grounded_sam_demo(
	input_pil, config_file, grounded_checkpoint, sam_checkpoint, text_prompt)

	print("doing to white")

	sd_mask_pil = get_sd_mask(colored_mask_pil)

	print("expanding white pixels")

	sd_mask_withpadding_pil = expand_white_pixels(sd_mask_pil, padding)

	return sd_mask_withpadding_pil