2022-03-05 23:25:56 +00:00
|
|
|
from typing import Any
|
|
|
|
|
|
|
|
import numpy as np
|
|
|
|
from PIL import Image, ImageOps
|
|
|
|
|
|
|
|
|
|
|
|
# Notice Preprocess class Must be named "Preprocess"
|
|
|
|
from clearml import StorageManager
|
|
|
|
|
|
|
|
|
|
|
|
class Preprocess(object):
|
|
|
|
def __init__(self):
|
|
|
|
# set internal state, this will be called only once. (i.e. not per request)
|
|
|
|
pass
|
|
|
|
|
2022-03-20 23:00:19 +00:00
|
|
|
def preprocess(self, body: dict, collect_custom_statistics_fn=None) -> Any:
|
2022-03-05 23:25:56 +00:00
|
|
|
# we expect to get two valid on the dict x0, and x1
|
|
|
|
url = body.get("url")
|
|
|
|
if not url:
|
|
|
|
raise ValueError("'url' entry not provided, expected http/s link to image")
|
|
|
|
|
|
|
|
local_file = StorageManager.get_local_copy(remote_url=url)
|
|
|
|
image = Image.open(local_file)
|
|
|
|
image = ImageOps.grayscale(image).resize((28, 28))
|
|
|
|
return np.array(image).flatten()
|
|
|
|
|
2022-03-20 23:00:19 +00:00
|
|
|
def postprocess(self, data: Any, collect_custom_statistics_fn=None) -> dict:
|
2022-03-05 23:25:56 +00:00
|
|
|
# post process the data returned from the model inference engine
|
|
|
|
# data is the return value from model.predict we will put is inside a return value as Y
|
|
|
|
if not isinstance(data, np.ndarray):
|
|
|
|
# this should not happen
|
|
|
|
return dict(digit=-1)
|
|
|
|
|
|
|
|
# data is returned as probability per class (10 class/digits)
|
|
|
|
return dict(digit=int(data.flatten().argmax()))
|