English
Inference Endpoints
real-esrgan / handler.py
garg-aayush's picture
weight path fix
68853b7
raw
history blame
6.04 kB
import torch
from PIL import Image
from io import BytesIO
from realesrgan import RealESRGANer
from typing import Dict, List, Any
import os
from pathlib import Path
from basicsr.archs.rrdbnet_arch import RRDBNet
import numpy as np
import cv2
import PIL
import boto3
import uuid, io
import torch
import base64
import requests
class EndpointHandler:
def __init__(self, path=""):
self.tiling_size = int(os.environ["TILING_SIZE"])
# Initialize the Real-ESRGAN model with specified parameters
self.model = RealESRGANer(
scale=4, # Scale factor for the model
# Path to the pre-trained model weights
model_path=f"/repository/weights/Real-ESRGAN-x4plus.pth",
# model_path=f"/workspace/real-esrgan/weights/Real-ESRGAN-x4plus.pth",
# Initialize the RRDBNet model architecture with specified parameters
model= RRDBNet(num_in_ch=3,
num_out_ch=3,
num_feat=64,
num_block=23,
num_grow_ch=32,
scale=4
),
tile=self.tiling_size,
tile_pad=0,
half=True,
)
# Initialize the S3 client with AWS credentials from environment variables
self.s3 = boto3.client('s3',
aws_access_key_id=os.environ['AWS_ACCESS_KEY_ID'],
aws_secret_access_key=os.environ['AWS_SECRET_ACCESS_KEY'],
)
# Get the S3 bucket name from environment variables
self.bucket_name = os.environ["S3_BUCKET_NAME"]
def __call__(self, data: Any) -> Dict[str, List[float]]:
try:
# get inputs
inputs = data.pop("inputs", data)
# get outscale
outscale = float(inputs.pop("outscale", 3))
# decode base64 image to PIL
image = self.download_image_url(inputs['image_url'])
in_size, in_mode = image.size, image.mode
# check image size and mode and return dict
assert in_mode in ["RGB", "RGBA", "L"], f"Unsupported image mode: {in_mode}"
if self.tiling_size == 0:
assert in_size[0] * in_size[1] < 1400*1400, f"Image is too large: {in_size}: {in_size[0] * in_size[1]} is greater than {self.tiling_size*self.tiling_size}"
assert outscale > 1 and outscale <=10, f"Outscale must be between 1 and 10: {outscale}"
# debug
print(f"image.size: {in_size}, image.mode: {in_mode}, outscale: {outscale}")
# Convert RGB to BGR (PIL uses RGB, OpenCV expects BGR)
opencv_image = np.array(image)
if in_mode == "RGB":
opencv_image = cv2.cvtColor(opencv_image, cv2.COLOR_RGB2BGR)
elif in_mode == "RGBA":
opencv_image = cv2.cvtColor(opencv_image, cv2.COLOR_RGBA2BGRA)
elif in_mode == "L":
opencv_image = cv2.cvtColor(opencv_image, cv2.COLOR_GRAY2RGB)
else:
raise ValueError(f"Unsupported image mode: {in_mode}")
# enhance image
output, _ = self.model.enhance(opencv_image, outscale=outscale)
# debug
print(f"output.shape: {output.shape}")
# convert to RGB/RGBA format
out_shape = output.shape
if len(out_shape) == 3:
if out_shape[2] == 3:
output = cv2.cvtColor(output, cv2.COLOR_BGR2RGB)
elif out_shape[2] == 4:
output = cv2.cvtColor(output, cv2.COLOR_BGRA2RGBA)
else:
output = cv2.cvtColor(output, cv2.COLOR_GRAY2RGB)
# convert to PIL image
img_byte_arr = BytesIO()
output = Image.fromarray(output)
# # save to BytesIO
# output.save(img_byte_arr, format='PNG')
# img_str = base64.b64encode(img_byte_arr.getvalue())
# img_str = img_str.decode()
image_url, key = self.upload_to_s3(output)
return {"image_url": image_url,
"image_key": key,
"error": None
}
# handle errors
except AssertionError as e:
print(f"AssertionError: {e}")
return {"out_image": None, "error": str(e)}
except KeyError as e:
print(f"KeyError: {e}")
return {"out_image": None, "error": f"Missing key: {e}"}
except ValueError as e:
print(f"ValueError: {e}")
return {"out_image": None, "error": str(e)}
except PIL.UnidentifiedImageError as e:
print(f"PIL.UnidentifiedImageError: {e}")
return {"out_image": None, "error": "Invalid image format"}
except Exception as e:
print(f"Exception: {e}")
return {"out_image": None, "error": "An unexpected error occurred"}
def upload_to_s3(self, image):
"Upload the image to s3 and return the url."
prefix = str(uuid.uuid4())
# Save the image to an in-memory file
in_mem_file = io.BytesIO()
image.save(in_mem_file, 'PNG')
in_mem_file.seek(0)
# Upload the image to s3
key = f"{prefix}.png"
self.s3.upload_fileobj(in_mem_file, Bucket=self.bucket_name, Key=key)
image_url = "https://{0}.s3.amazonaws.com/{1}".format(self.bucket_name, key)
# return the url and the key
return image_url, key
def download_image_url(self, image_url):
"Download the image from the url and return the image."
response = requests.get(image_url)
image = Image.open(BytesIO(response.content))
return image