Spaces:

sentencebird
/

image-color-vectorization

Running

App Files Files Community

image-color-vectorization / torchvision_funcs.py

sentencebird

Update torchvision_funcs.py

5717cac about 3 years ago

raw

history blame contribute delete

1.79 kB

	import os
	import numpy as np
	import cv2
	from PIL import Image
	import pickle
	from google_drive_downloader import GoogleDriveDownloader as gdd

	import torch
	import torchvision
	from torchvision import transforms
	from torchvision.models.segmentation import deeplabv3_resnet101
	from torchvision.models.segmentation.deeplabv3 import DeepLabHead


	def deeplabv3_remove_bg(img):
	img = np.array(img, dtype=np.uint8)
	# img = cv2.imread(image_path)
	# img = img[...,::-1] #BGR->RGB
	h,w,_ = img.shape
	# img = cv2.resize(img,(1000,1000))

	device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
	# if not os.path.exists('./deeplabv3_resnet101.pkl'):
	# gdd.download_file_from_google_drive(file_id=os.environ['MODEL_ID'], dest_path='/tmp/deeplabv3_resnet101.pkl')
	# with open('./deeplabv3_resnet101.pkl', 'rb') as f:
	# model = pickle.load(f)
	model = deeplabv3_resnet101(pretrained=True)
	model.classifier = DeepLabHead(2048, num_classes=1)
	model = model.to(device)
	model.eval()

	preprocess = transforms.Compose([
	transforms.ToTensor(),
	transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
	])
	input_tensor = preprocess(img)
	input_batch = input_tensor.unsqueeze(0).to(device)

	with torch.no_grad():
	output = model(input_batch)['out'][0]
	del model
	output = output.argmax(0)
	mask = output.byte().cpu().numpy()
	# mask = cv2.resize(mask,(w,h))
	# img = cv2.resize(img,(w,h))
	mask[mask>0] = 1.0 # NOTE: なぜか3が入っていたので
	mask = np.dstack([mask, mask, mask])
	img_masked = Image.fromarray(cv2.multiply(img, mask))
	index_masked = np.where(np.array(mask)[:,:,2]==0)
	return img_masked, index_masked