cloud-node/model.py

import os
import uuid
import json
import base64
from functools import reduce
import shutil

import boto3
from keras import backend as K
from keras.models import load_model
from keras.losses import categorical_crossentropy, mean_squared_error
from keras.optimizers import SGD, Adam
import numpy as np
import tensorflowjs as tfjs
import coremltools
from coremltools.converters import keras as keras_converter
from coremltools.proto import FeatureTypes_pb2 as _FeatureTypes_pb2
from coremltools.models.neural_network import SgdParams, AdamParams
from coremltools.models import MLModel
import tensorflow as tf
tf.compat.v1.disable_v2_behavior()

import state
from message import LibraryType
from parse_weights import calculate_new_weights


TEMP_FOLDER = 'temp'
UNLIMITED_EPOCHS = 100000

def convert_and_save_b64model(base64_h5_model):
    """
    Takes the initial h5 model encoded in Base64, decodes it, saves it on
    disk (in `<TEMP_FOLDER>/<repo_id>/<session_id>/model.h5`), then calls the
    helper function `_convert_and_save_model()` to convert the model into a 
    tf.js model which will be served to library nodes.

    This function is to be called at the beginning of a DML Session with
    Javascript libraries.

    Args:
        base64_h5_model (str): base64 string of an h5 Keras model
    """
    h5_model_path = save_h5_model(base64_h5_model)
    # Convert and save model for serving
    _convert_and_save_model(h5_model_path)

def fetch_keras_model():
    """
    Download the initial Keras model.

    This function is to be called at the beginning of a DML Session.
    """
    model_path = _fetch_model_folder()

    # Create directory if necessary
    if not os.path.exists(model_path):
        os.makedirs(model_path)

    # Save model on disk
    h5_model_path = model_path + '/model.h5'
    try:
        repo_id = state.state["repo_id"]
        session_id = state.state["session_id"]
        s3 = boto3.resource("s3")
        model_s3_key = "{0}/{1}/{2}/model.h5"
        model_s3_key = model_s3_key.format(repo_id, session_id, 0)
        object = s3.Object("updatestore", model_s3_key)
        object.download_file(h5_model_path)
    except Exception as e:
        print("S3 Error: {0}".format(e))

    state.state['h5_model_path'] = h5_model_path
    
    return state.state['h5_model_path']

def fetch_mlmodel():
    """
    Download the MLModel converted from a Keras model.

    This function is to be called at the beginning of a DML Session.

    NOTE: This function is only for text models to be used with iOS libraries.
    """
    model_path = _fetch_model_folder()

    # Create directory if necessary
    if not os.path.exists(model_path):
        os.makedirs(model_path)

    # Save model on disk
    mlmodel_path = model_path + '/my_model.mlmodel'
    try:
        repo_id = state.state["repo_id"]
        session_id = state.state["session_id"]
        s3 = boto3.resource("s3")
        model_s3_key = "{0}/{1}/{2}/model.mlmodel"
        model_s3_key = model_s3_key.format(repo_id, session_id, 0)
        object = s3.Object("updatestore", model_s3_key)
        object.download_file(h5_model_path)
    except Exception as e:
        print("S3 Error: {0}".format(e))

    state.state['mlmodel_path'] = h5_model_path
    
    return state.state['mlmodel_path']
    
def save_mlmodel_weights(binary_weights):
    """
    Save the provided binary weights from the iOS Library so that gradient
    calculation can be done.

    Only called after round 1 of training with the iOS Library for text data.
    
    Args:
        binary_weights (str): The binary weights to be saved.
    """
    mlmodel_path = _fetch_model_folder()
    mlmodel_weights_path = os.path.join(mlmodel_folder_path, "weights")
    with open(mlmodel_folder_path, "rb") as f:
        f.write(binary_weights)
        state.state["mlmodel_weights_path"] = mlmodel_weights_path

def get_encoded_h5_model():
    """
    Get the encoded string of the h5 Keras model.

    Returns:
        str: Returns a base64 string of the h5 Keras model
    """
    with open(state.state["h5_model_path"], mode='rb') as file:
        file_content = file.read()
        encoded_content = base64.encodebytes(file_content)
        h5_model = encoded_content.decode('ascii')
        return h5_model

def get_keras_model():
    """
    Load the Keras model from the `.h5` file.

    Returns:
        keras.engine.Model: Returns the loaded Keras model.
    """
    return load_model(state.state["h5_model_path"])

def convert_keras_model_to_tfjs():
    """
    Retrieves the current Keras model, converts it (from the path) into a
    tf.js model, extracts metadata from the model, and prepares the temp 
    folder where this new converted model will be served from.

    The new converted model gets stored in:
        `<TEMP_FOLDER>/<repo_id>/<session_id>/<current_round>`

    Where the following files get created:
        - `group1.-shard1of1.bin`
        - `model.json`
        - `metadata.json`
    """
    model_path = _fetch_model_folder()
    session_id = state.state["session_id"]
    current_round = state.state["current_round"]
    tfjs_model_path = os.path.join(model_path, str(current_round))
    state.state["tfjs_model_path"] = tfjs_model_path

    _keras_2_tfjs()

    model_json_path = state.state["tfjs_model_path"] + "/model.json"
    with open(model_json_path, 'r') as fp:
        model_json = json.loads(fp.read())
        state.state["weights_shape"] = model_json["weightsManifest"][0]["weights"]

    metadata_path = state.state["tfjs_model_path"] + '/metadata.json'
    metadata = {
        "session_id": session_id,
        "current_round": current_round,
    }
    with open(metadata_path, 'w') as fp:
        json.dump(metadata, fp, sort_keys=True, indent=4)

def convert_keras_model_to_mlmodel():
    """
    Retrieves the current Keras model, converts it (from the path) into a
    MLModel and prepares the temp folder where this new converted model will
    be served from.

    The new converted model gets stored in:
        `<TEMP_FOLDER>/<repo_id>/<session_id>/<current_round>`

    Where the following files get created:
        - `my_model.mlmodel`
    """
    model_path = _fetch_model_folder()
    current_round = state.state["current_round"]
    mlmodel_folder_path = os.path.join(model_path, str(current_round))
    if not os.path.exists(mlmodel_folder_path):
        os.makedirs(mlmodel_folder_path)
    state.state["mlmodel_path"] = os.path.join(mlmodel_folder_path, "my_model.mlmodel")

    _keras_2_mlmodel_image()

def swap_weights():
    """
    For most libraries, load the stored h5 model, swap the weights with the 
    aggregated weights currently in the global state, then saves the new model 
    in <TEMP_FOLDER>/<repo_id>/<session_id>/model<round>.h5.

    For iOS libraries, read the binary weights file at the old weights path,
    and write to a new binary weights file at 
    <TEMP_FOLDER>/<repo_id>/<session_id>/weights.

    For Javascript libraries, this function also reconverts the Keras model
    to a TFJS model.

    For iOS libraries (image), this function also reconverts the Keras model
    to a iOS model.
    """
    model = get_keras_model()
    _clear_checkpoint()

    base_model_path = _fetch_model_folder()
    current_round = state.state["current_round"]
    new_h5_model_path = base_model_path + '/model{0}.h5'.format(current_round)
    state.state['h5_model_path'] = new_h5_model_path

    if state.state["library_type"] == LibraryType.PYTHON.value:
        gradients = state.state["current_gradients"]
        learning_rate = model.optimizer.lr
        weights = model.get_weights()
        new_weights = np.subtract(weights, gradients)
        model.set_weights(new_weights)
        model.save(new_h5_model_path)
    elif state.state["library_type"] == LibraryType.IOS_IMAGE.value:
        gradients = state.state["current_gradients"]
        learning_rate = K.eval(model.optimizer.lr)
        new_weights = []
        k = 0

        for old_weight, grad in zip(model.get_weights(), gradients):
            num_params = np.prod(old_weight.shape)
            if len(grad) > num_params:
                grad = grad[:num_params]
            grad = np.array(grad)
            grad = np.reshape(grad, list(reversed(old_weight.shape)))
            if len(old_weight.shape) > 1:
                grad = np.transpose(grad)
            new_weights.append(old_weight - grad)

        model.set_weights(new_weights)
        model.save(new_h5_model_path)
        convert_keras_model_to_mlmodel()
    elif state.state["library_type"] == LibraryType.IOS_TEXT.value:
        old_mlmodel_weights_path = state.state["mlmodel_weights_path"]
        new_mlmodel_weights_path = base_model_path + '/weights{0}'.format(current_round)
        gradients = state.state["current_gradients"]
        learning_rate = K.eval(model.optimizer.lr)
        _ = calculate_new_weights(old_mlmodel_weights_path, \
                new_mlmodel_weights_path, lr=learning_rate)
        state.state["mlmodel_weights_path"] = new_mlmodel_weights_path
    else:
        weights_flat = state.state["current_weights"]
        weights_shape = state.state["weights_shape"]
        weights, start = [], 0
        for shape_data in weights_shape:
            shape = shape_data["shape"]
            size = reduce(lambda x, y: x*y, shape)
            weights_np = np.array(weights_flat[start:start+size])
            weights_np.resize(tuple(shape))
            weights.append(weights_np)
            start += size
        model.set_weights(weights)
        model.save(new_h5_model_path)
        convert_keras_model_to_tfjs()

    K.clear_session()

def _clear_checkpoint():
    """
    Removes the current model.

    NOTE: Only call when model no longer needed!
    """
    os.remove(state.state["h5_model_path"])
    if state.state["library_type"] == LibraryType.JS.value:
        shutil.rmtree(state.state['tfjs_model_path'])

def _keras_2_tfjs():
    """
    Converts a Keras h5 model into a tf.js model and saves it on disk.
    """
    model = get_keras_model()
    tfjs.converters.save_keras_model(model, state.state["tfjs_model_path"], np.uint16)
    K.clear_session()

def _keras_2_mlmodel_image():
    """
    Converts a Keras h5 model into ML Model for image data and saves it on 
    disk.

    NOTE: Image configuration must be specified from Explora. 

    NOTE: Currently, only categorical cross entropy loss is supported.
    """
    model = get_keras_model()
    ios_config = state.state["ios_config"]
    class_labels = ios_config["class_labels"]
    mlmodel = keras_converter.convert(model, input_names=['image'],
                                output_names=['output'],
                                class_labels=class_labels,
                                predicted_feature_name='label')
    mlmodel.save(state.state["mlmodel_path"])

    image_config = ios_config["image_config"]
    spec = coremltools.utils.load_spec(state.state["mlmodel_path"])
    builder = coremltools.models.neural_network.NeuralNetworkBuilder(spec=spec)

    dims = image_config["dims"]
    spec.description.input[0].type.imageType.width = dims[0]
    spec.description.input[0].type.imageType.height = dims[1]

    cs = _FeatureTypes_pb2.ImageFeatureType.ColorSpace.Value(image_config["color_space"])
    spec.description.input[0].type.imageType.colorSpace = cs

    trainable_layer_names = [layer.name for layer in model.layers if layer.get_weights()]
    builder.make_updatable(trainable_layer_names)

    builder.set_categorical_cross_entropy_loss(name='loss', input='output')

    if isinstance(model.optimizer, SGD):
        params = SgdParams(
            lr=K.eval(model.optimizer.lr), 
            batch=state.state["hyperparams"]["batch_size"],
        )
        builder.set_sgd_optimizer(params)
    elif isinstance(model.optimizer, Adam):
        params = AdamParams(
            lr=K.eval(model.optimizer.lr), 
            batch_size=state.state["hyperparams"]["batch_size"],
            beta1=model.optimizer.beta1,
            beta2=model.optimizer.beta2,
            eps=model.optimizer.eps,    
        )
        builder.set_adam_optimizer(params)
    else:
        raise Exception("iOS optimizer must be SGD or Adam!")

    builder.set_epochs(UNLIMITED_EPOCHS)
    builder.set_shuffle(state.state["hyperparams"]["shuffle"])  

    mlmodel_updatable = MLModel(spec)
    mlmodel_updatable.save(state.state["mlmodel_path"])

    K.clear_session()

def _fetch_model_folder():
    """
    Retreive the model folder for this session.
    """
    repo_id = state.state["repo_id"]
    session_id = state.state["session_id"]
    return os.path.join(TEMP_FOLDER, repo_id, session_id)


# def decode_weights(h5_model_path):
#     """
#     Do Keras stuff here
#     """
#     model = keras.models.load_model(h5_model_path)
#     weights = model.get_weights()
#     return weights


# def _test2():
#     out = decode_weights('../notebooks/saved_mlp_model_with_w.h5')
#     print(out)