Table of contents
- Serving using TensorFlow
  - Mini batching
  - Some positive points
- Edge device serving using TensorFlow Lite
- Deploying models on AWS
Serving using TensorFlow
This video explains things in detail. The high-level steps are as follows:
- Save the model. This exports the model as a protobuf, which contains all the essentials (the graph, variables, etc.).
```python
import tensorflow as tf

# export the model in the SavedModel (protobuf) format
tf.saved_model.save(model, export_dir="saved_models/", signatures=None)
```
- Use Docker for serving
```bash
docker pull tensorflow/serving
# 8500 = gRPC, 8501 = REST; saved_models/ should contain a numeric version dir (e.g. 1/)
docker run -p 8500:8500 -p 8501:8501 \
  -v "$(pwd)/saved_models:/models/my_model" \
  -e MODEL_NAME=my_model \
  -t tensorflow/serving
# GPU image
docker run -t tensorflow/serving:latest-gpu
```
REST POST requests can be made to the exposed REST port (8501) and the predictions come back as JSON. There is another method using gRPC (port 8500) which is more efficient.
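A minimal client sketch, assuming the container above is running, the model is named my_model, and it takes a single flat feature vector (adjust the instance shape to your model):

```python
import json
import requests  # third-party HTTP client

# TensorFlow Serving's REST predict endpoint
url = "http://localhost:8501/v1/models/my_model:predict"
payload = {"instances": [[1.0, 2.0, 3.0, 4.0]]}  # one example; shape is model-specific

resp = requests.post(url, data=json.dumps(payload))
print(resp.json()["predictions"])  # list of model outputs, one per instance
```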
A REST API can also be implemented in Flask.
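A rough sketch of that alternative, assuming a Keras model saved as model.h5 (hypothetical path) and the same flat input format as above:

```python
import numpy as np
from flask import Flask, request, jsonify
from tensorflow import keras

app = Flask(__name__)
model = keras.models.load_model("model.h5")  # hypothetical path

@app.route("/predict", methods=["POST"])
def predict():
    # expects {"instances": [[...], ...]}, mirroring the TF Serving REST API
    instances = np.array(request.get_json()["instances"])
    preds = model.predict(instances)
    return jsonify({"predictions": preds.tolist()})

if __name__ == "__main__":
    app.run(port=5000)
```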
Mini batching
Mini batching is a key feature of TensorFlow Serving that is difficult to do in Flask. When multiple clients send requests at the same time, TensorFlow Serving groups them into a mini batch and runs a single forward pass, which uses the hardware more efficiently.
Some positive points
- Automatic loading and unloading of updated model versions, because the model directory is polled (roughly every 2 seconds).
- NVIDIA TensorRT can be used to quantize from float32 to float16/int8 during inference. This can be added as an option.
Edge device serving using TensorFlow Lite
Positive points of TFLite
- A new, lighter version of TensorFlow: models are converted and saved as a TFLite FlatBuffer using the TFLite converter (see the sketch after this list).
- Support for the Keras API.
- It is cross-platform, so it can be used on Android as well as iOS.
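A minimal conversion sketch, assuming a Keras model object named model (from_saved_model is another entry point of the converter):

```python
import tensorflow as tf

# convert a Keras model to a TFLite FlatBuffer
converter = tf.lite.TFLiteConverter.from_keras_model(model)
tflite_model = converter.convert()

# write the FlatBuffer to disk; this file is what ships to the device
with open("model.tflite", "wb") as f:
    f.write(tflite_model)
```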
We might not want to score the model in the cloud, e.g. because of data transfer restrictions; we don't want the cloud to do everything.
Deploying models on AWS
We can save the weights and the structure (JSON) separately. Weights can be saved to HDF5 with model.save_weights("model.h5"), and the structure with model.to_json(), which returns a JSON string that we write to a file.
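A short sketch of this split save/restore, assuming a compiled Keras model named model (file names are placeholders):

```python
from keras.models import model_from_json

# save: weights to HDF5, structure to JSON
model.save_weights("model_weights.h5")
with open("model_structure.json", "w") as f:
    f.write(model.to_json())

# restore: rebuild the structure, then load the weights into it
with open("model_structure.json") as f:
    loaded_model = model_from_json(f.read())
loaded_model.load_weights("model_weights.h5")
```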
Formats are:
- yaml - structure only
- json - structure only
- h5 - complete model (structure + weights; see the sketch after this list)
- h5 - weights only
- A protocol buffer, or protobuf, is the format used by Google for deploying models (the SavedModel format).
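For the complete-model h5 case, a minimal sketch (the file name is a placeholder):

```python
from keras.models import load_model

# saves structure, weights and optimizer state in a single HDF5 file
model.save("full_model.h5")

# later: restore the whole model in one call
restored = load_model("full_model.h5")
```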
Things required for AWS deployment
```python
import boto3  # interface into SageMaker from Python
from sagemaker import get_execution_role

role = get_execution_role()  # the IAM role the notebook instance runs under
```
AWS requires standalone Keras directly (import keras), not the one inside TensorFlow (tf.keras). Apart from this, we must also consider the following for exporting the model.
```python
model_version = "1"
export_dir = "export/Servo/" + model_version  # note the trailing "/" so the version lands under export/Servo/
```
Then create the builder:
```python
from tensorflow.python.saved_model import builder
from tensorflow.python.saved_model.signature_def_utils import predict_signature_def
from tensorflow.python.saved_model import tag_constants

build = builder.SavedModelBuilder(export_dir)
# map the loaded Keras model's input/output tensors into a serving signature
signature = predict_signature_def(inputs={"inputs": loaded_model.input},
                                  outputs={"score": loaded_model.output})
```
This saves the model as a .pb (protobuf); essentially it creates a whole directory containing the graph definition and the variables.
```python
from keras import backend as K

with K.get_session() as sess:
    build.add_meta_graph_and_variables(
        sess=sess,
        tags=[tag_constants.SERVING],
        signature_def_map={"serving_default": signature},
    )

build.save()
```
Tar the complete directory and upload it to S3.
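A sketch of the tar step, assuming the SavedModel was written under export/ as above:

```python
import tarfile

# package the whole export/ tree into model.tar.gz for S3
with tarfile.open("model.tar.gz", mode="w:gz") as archive:
    archive.add("export", recursive=True)
```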
```python
import sagemaker

sagemaker_session = sagemaker.Session()
# uploads model.tar.gz to the session's default S3 bucket under the "model" prefix
inputs = sagemaker_session.upload_data(path="model.tar.gz", key_prefix="model")
```
Actual deployment.
There is a bug in SageMaker and entry_point needs an (empty) train.py file.

```python
!touch train.py  # empty placeholder entry point required by the SDK

from sagemaker.tensorflow.model import TensorFlowModel

sagemaker_model = TensorFlowModel(
    model_data="s3://" + sagemaker_session.default_bucket() + "/model/model.tar.gz",
    role=role,
    framework_version="1.12",
    entry_point="train.py",
)

predictor = sagemaker_model.deploy(initial_instance_count=1,
                                   instance_type="ml.m4.xlarge")
predictor.endpoint  # prints the endpoint name; needed below
```
Using the deployed model
```python
import json
import sagemaker
from sagemaker.tensorflow.model import TensorFlowPredictor

endpoint_name = "output from above command"
predictor = TensorFlowPredictor(endpoint_name, sagemaker_session)
data = train_X[0:]  # the examples to score

# to run inference from inside AWS
client = boto3.client("runtime.sagemaker")
response = client.invoke_endpoint(EndpointName=endpoint_name,
                                  Body=json.dumps(data))
response_body = response["Body"]  # streaming object holding the JSON predictions
```
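A small sketch of reading that streaming body back into Python, continuing from the response above (the field names inside the JSON depend on the serving signature):

```python
# Body is a streaming object; read and decode it to get the JSON payload
result = json.loads(response_body.read().decode("utf-8"))
print(result)
```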
```python
# outside AWS, build the client with explicit credentials and region
client = boto3.client("runtime.sagemaker",
                      region_name="us-east-1",
                      aws_access_key_id="",
                      aws_secret_access_key="")
# these access keys come from IAM (Identity and Access Management)
```