ibm-watson-machine-learning
This notebook contains steps and code to train a scikit-learn model that uses a custom-defined transformer, and to use that model with the Watson Machine Learning service. Once the model is trained, the notebook shows how to persist the model and the custom transformer to the Watson Machine Learning Repository, then deploy and score the model using the Watson Machine Learning Python client.
In this notebook, we use the GNFUV dataset, which contains mobile sensor readings of humidity and temperature from Unmanned Surface Vehicles in a test-bed in Athens, to train a scikit-learn model that predicts the temperature.
Some familiarity with Python is helpful. This notebook uses Python & scikit-learn.
The learning goals of this notebook are:
- Training a scikit-learn model that uses a custom-defined transformer
- Persisting the model and the custom transformer library to the Watson Machine Learning Repository
- Deploying and scoring the model using the Watson Machine Learning Python client
Before you use the sample code in this notebook, you must perform the following setup tasks:
Authenticate the Watson Machine Learning service on IBM Cloud. You need to provide your platform `api_key` and instance `location`.
You can use the IBM Cloud CLI to retrieve the platform API key and instance location.
The API key can be generated in the following way:
ibmcloud login
ibmcloud iam api-key-create API_KEY_NAME
From the output, copy the value of `api_key`.
The location of your WML instance can be retrieved in the following way:
ibmcloud login --apikey API_KEY -a https://cloud.ibm.com
ibmcloud resource service-instance WML_INSTANCE_NAME
From the output, copy the value of `location`.
Tip: Your Cloud API key can be generated by going to the Users section of the Cloud console. From that page, click your name, scroll down to the API Keys section, and click Create an IBM Cloud API key. Give your key a name and click Create, then copy the created key and paste it below. You can also get a service-specific URL by going to the Endpoint URLs section of the Watson Machine Learning docs, and you can check your instance location in your Watson Machine Learning (WML) Service instance details.
You can also get a service-specific `apikey` by going to the Service IDs section of the Cloud console. From that page, click Create, then copy the created key and paste it below.
Action: Enter your `api_key` and `location` in the following cell.
api_key = 'PASTE YOUR PLATFORM API KEY HERE'
location = 'PASTE YOUR INSTANCE LOCATION HERE'
wml_credentials = {
"apikey": api_key,
"url": 'https://' + location + '.ml.cloud.ibm.com'
}
!pip install -U ibm-watson-machine-learning
from ibm_watson_machine_learning import APIClient
client = APIClient(wml_credentials)
First of all, you need to create a space that will be used for your work. If you do not have a space already created, you can use the Deployment Spaces Dashboard to create one. Once the space is created, copy its `space_id` and paste it below.
Tip: You can also use the SDK to prepare the space for your work. More information can be found here.
Action: Assign the space ID below.
space_id = 'PASTE YOUR SPACE ID HERE'
You can use the `list` method to print all existing spaces.
client.spaces.list(limit=10)
To be able to interact with all resources available in Watson Machine Learning, you need to set the space you will be using as the default space.
client.set.default_space(space_id)
The library `linalgnorm-0.1` is a Python distributable package that contains the implementation of a user-defined scikit-learn transformer, `LNormalizer`.
Any third-party libraries required by the custom transformer must be declared as dependencies of the library that contains the transformer's implementation.
In this section, we will create the library and install it in the current notebook environment.
!mkdir -p linalgnorm-0.1/linalg_norm
Define a custom scikit-learn transformer.
%%writefile linalgnorm-0.1/linalg_norm/sklearn_transformers.py
from sklearn.base import BaseEstimator, TransformerMixin
import numpy as np


class LNormalizer(BaseEstimator, TransformerMixin):
    def __init__(self, norm_ord=2):
        self.norm_ord = norm_ord
        self.row_norm_vals = None

    def fit(self, X, y=None):
        # column-wise norms of the training data (axis=0)
        self.row_norm_vals = np.linalg.norm(X, ord=self.norm_ord, axis=0)
        return self  # scikit-learn convention: fit returns self

    def transform(self, X, y=None):
        return X / self.row_norm_vals

    def fit_transform(self, X, y=None):
        self.fit(X, y)
        return self.transform(X, y)

    def get_norm_vals(self):
        return self.row_norm_vals
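To make the transformer's math concrete, here is the same column-norm computation on a tiny array (the values below are illustrative only):

```python
import numpy as np

# two columns; the L2 norm of column 0 is sqrt(3^2 + 4^2) = 5, of column 1 is 0.5
X = np.array([[3.0, 0.0],
              [4.0, 0.5]])
norms = np.linalg.norm(X, ord=2, axis=0)
X_scaled = X / norms  # what LNormalizer.transform() returns after fit(X)
print(norms)                                     # [5.  0.5]
print(np.linalg.norm(X_scaled, ord=2, axis=0))   # each column now has unit norm
```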
Wrap created code into Python source distribution package.
%%writefile linalgnorm-0.1/linalg_norm/__init__.py
__version__ = "0.1"
%%writefile linalgnorm-0.1/README.md
A simple library containing a simple custom scikit estimator.
%%writefile linalgnorm-0.1/setup.py
from setuptools import setup

VERSION = '0.1'

setup(name='linalgnorm',
      version=VERSION,
      url='https://github.ibm.com/NGP-TWC/repository/',
      author='IBM',
      author_email='[email protected]',
      license='IBM',
      packages=['linalg_norm'],
      zip_safe=False)
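The setup.py above declares no third-party dependencies. As noted earlier, any packages the custom transformer needs must be declared by the library itself; a sketch with a hypothetical `install_requires` entry follows (the pinned dependency is illustrative, not part of the original library):

```python
# hypothetical setup.py declaring a third-party dependency for the transformer
from setuptools import setup

setup(name='linalgnorm',
      version='0.1',
      packages=['linalg_norm'],
      # third-party packages the custom transformer depends on
      install_requires=['numpy'],
      zip_safe=False)
```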
%%bash
cd linalgnorm-0.1
python setup.py sdist --formats=zip
cd ..
mv linalgnorm-0.1/dist/linalgnorm-0.1.zip .
rm -rf linalgnorm-0.1
Install the created library package using the `pip` command.
!pip install linalgnorm-0.1.zip
Download the data from UCI repository - https://archive.ics.uci.edu/ml/machine-learning-databases/00452/GNFUV%20USV%20Dataset.zip
!rm -rf dataset
!mkdir dataset
!wget https://archive.ics.uci.edu/ml/machine-learning-databases/00452/GNFUV%20USV%20Dataset.zip --output-document=dataset/gnfuv_dataset.zip
!unzip dataset/gnfuv_dataset.zip -d dataset
Create a pandas dataframe from the downloaded dataset.
import json
import pandas as pd
import numpy as np
import os
from datetime import datetime
from json import JSONDecodeError

home_dir = './dataset'
pi_dirs = os.listdir(home_dir)
data_list = []
base_time = None
columns = None

for pi_dir in pi_dirs:
    if 'pi' not in pi_dir:
        continue
    curr_dir = os.path.join(home_dir, pi_dir)
    data_file = os.path.join(curr_dir, os.listdir(curr_dir)[0])
    with open(data_file, 'r') as f:
        # each line is a Python-style dict; convert quotes so it parses as JSON
        line = f.readline().strip().replace("'", '"')
        while line != '':
            try:
                input_json = json.loads(line)
                sensor_datetime = datetime.fromtimestamp(input_json['time'])
                if base_time is None:
                    base_time = datetime(sensor_datetime.year, sensor_datetime.month,
                                         sensor_datetime.day, 0, 0, 0, 0)
                # express time as seconds elapsed since midnight of the first reading
                input_json['time'] = (sensor_datetime - base_time).seconds
                data_list.append(list(input_json.values()))
                if columns is None:
                    columns = list(input_json.keys())
            except JSONDecodeError:
                # skip malformed lines
                pass
            line = f.readline().strip().replace("'", '"')

data_df = pd.DataFrame(data_list, columns=columns)
data_df.head()
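Each raw line in the GNFUV files is a Python-style dict with single quotes, which is why the loop above rewrites them to double quotes before calling `json.loads`. A sketch of the per-line parsing on one illustrative record (the field names follow the dataset's format; the values are made up):

```python
import json
from datetime import datetime

# one illustrative raw line in the single-quoted format the GNFUV files use
raw = "{'device': 'pi2', 'humidity': 47, 'temperature': 22, 'experiment': 1, 'time': 1524231600}"
record = json.loads(raw.replace("'", '"'))   # the same quote fix the loop applies
sensor_datetime = datetime.fromtimestamp(record['time'])
print(record['humidity'], record['temperature'])  # 47 22
```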
Create training and test datasets from the downloaded GNFUV-USV dataset.
from sklearn.model_selection import train_test_split
Y = data_df['temperature']
X = data_df.drop('temperature', axis=1)
X_train, X_test, y_train, y_test = train_test_split(X, Y, test_size=0.25, random_state=143)
In this section, you will use the custom transformer as a stage in a scikit-learn `Pipeline` and train a model.
Here, import the custom transformer defined in `linalgnorm-0.1.zip` and create an instance of it, which will in turn be used as a stage in the scikit-learn `Pipeline`.
from linalg_norm.sklearn_transformers import LNormalizer
lnorm_transf = LNormalizer()
Import the other objects required to train a model.
from sklearn.pipeline import Pipeline
from sklearn.linear_model import LinearRegression
Now you can create a `Pipeline` with the user-defined transformer as one of the stages and train the model.
skl_pipeline = Pipeline(steps=[('normalizer', lnorm_transf), ('regression_estimator', LinearRegression())])
skl_pipeline.fit(X_train.loc[:, ['time', 'humidity']].values, y_train)
y_pred = skl_pipeline.predict(X_test.loc[:, ['time', 'humidity']].values)
rmse = np.mean((np.round(y_pred) - y_test.values)**2)**0.5
print('RMSE: {}'.format(rmse))
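The RMSE above is computed by hand (after rounding the predictions). The same quantity can also be obtained from scikit-learn's metrics; a sketch on synthetic values, since it would otherwise need the notebook's `y_test` and `y_pred`:

```python
import numpy as np
from sklearn.metrics import mean_squared_error

# synthetic stand-ins for the notebook's y_test values and predictions
y_true = np.array([20.0, 21.5, 19.0])
y_hat = np.array([20.5, 21.0, 18.0])

rmse_manual = np.mean((y_hat - y_true) ** 2) ** 0.5
rmse_sklearn = np.sqrt(mean_squared_error(y_true, y_hat))
print(rmse_manual, rmse_sklearn)  # both ways agree
```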
In this section, using the `ibm-watson-machine-learning` SDK, you will store `linalgnorm-0.1.zip` in the WML Repository by creating a package extension resource.
Define the metadata required to create the package extension resource.
The value of `file_path` in `client.package_extensions.store()` is the name of the library file that must be uploaded to WML.
Note: You can also use a conda environment configuration file (yaml) as the package extension input. In that case, set the `TYPE` to `conda_yml` and `file_path` to the yaml file:
client.package_extensions.ConfigurationMetaNames.TYPE = "conda_yml"
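As an illustration of the conda option, a minimal environment file could be written like this (the environment name and the pinned package below are hypothetical, not part of this notebook's workflow):

```python
# a minimal, hypothetical conda environment file for a conda_yml package extension
conda_yml = """\
name: custom-env
dependencies:
  - pip
  - pip:
    - linalgnorm==0.1
"""
with open("environment.yml", "w") as f:
    f.write(conda_yml)
```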
meta_prop_pkg_extn = {
client.package_extensions.ConfigurationMetaNames.NAME: "K_Linag_norm_skl",
client.package_extensions.ConfigurationMetaNames.DESCRIPTION: "Pkg extension for custom lib",
client.package_extensions.ConfigurationMetaNames.TYPE: "pip_zip"
}
pkg_extn_details = client.package_extensions.store(meta_props=meta_prop_pkg_extn, file_path="linalgnorm-0.1.zip")
pkg_extn_uid = client.package_extensions.get_uid(pkg_extn_details)
pkg_extn_url = client.package_extensions.get_href(pkg_extn_details)
Display the details of the package extension resource that was created in the above cell.
details = client.package_extensions.get_details(pkg_extn_uid)
print(json.dumps(details, indent=2))
Define the metadata required to create the software specification resource and bind the package extension to it. This software specification resource will be used to configure the online deployment runtime environment for the model.
client.software_specifications.ConfigurationMetaNames.show()
client.software_specifications.list()
base_sw_spec_uid = client.software_specifications.get_uid_by_name("runtime-23.1-py3.10")
meta_prop_sw_spec = {
client.software_specifications.ConfigurationMetaNames.NAME: "linalgnorm-0.1",
client.software_specifications.ConfigurationMetaNames.DESCRIPTION: "Software specification for linalgnorm-0.1",
client.software_specifications.ConfigurationMetaNames.BASE_SOFTWARE_SPECIFICATION: {"guid": base_sw_spec_uid}
}
sw_spec_details = client.software_specifications.store(meta_props=meta_prop_sw_spec)
sw_spec_uid = client.software_specifications.get_uid(sw_spec_details)
client.software_specifications.add_package_extension(sw_spec_uid, pkg_extn_uid)
Define the metadata to save the trained model to the WML Repository, along with the information about the software specification resource required by the model.
The `client.repository.ModelMetaNames.SOFTWARE_SPEC_UID` metadata property specifies the GUID of the software specification resource to associate with the model.
model_props = {
client.repository.ModelMetaNames.NAME: "Temp prediction model with custom lib",
client.repository.ModelMetaNames.TYPE: 'scikit-learn_1.1',
client.repository.ModelMetaNames.SOFTWARE_SPEC_UID: sw_spec_uid
}
Save the model to the WML Repository and display its saved metadata.
published_model = client.repository.store_model(model=skl_pipeline, meta_props=model_props)
published_model_uid = client.repository.get_model_id(published_model)
model_details = client.repository.get_details(published_model_uid)
print(json.dumps(model_details, indent=2))
In this section, you will deploy the saved model that uses the custom transformer and perform predictions. You will use WML client to perform these tasks.
metadata = {
client.deployments.ConfigurationMetaNames.NAME: "Deployment of custom lib model",
client.deployments.ConfigurationMetaNames.ONLINE: {}
}
created_deployment = client.deployments.create(published_model_uid, meta_props=metadata)
Note: Here we retrieve the deployment `uid` from the `created_deployment` object. In the next section, we show how to retrieve the deployment URL from the Watson Machine Learning instance.
deployment_uid = client.deployments.get_uid(created_deployment)
Now you can print an online scoring endpoint.
scoring_endpoint = client.deployments.get_scoring_href(created_deployment)
print(scoring_endpoint)
scoring_payload = {
"input_data": [{
'fields': ["time", "humidity"],
'values': [[79863, 47]]}]
}
Execute the method to perform online predictions and display the prediction results.
predictions = client.deployments.score(deployment_uid, scoring_payload)
print(json.dumps(predictions, indent=2))
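Assuming the usual WML online-scoring response shape (a `predictions` list whose entries carry `fields` and `values`), the predicted value can be extracted as below. The response here is mocked and the numeric value is illustrative:

```python
# mocked response in the shape returned by client.deployments.score()
predictions = {
    "predictions": [
        {"fields": ["prediction"], "values": [[21.7]]}
    ]
}
# first record, first value of the first prediction row
predicted_temperature = predictions["predictions"][0]["values"][0][0]
print(predicted_temperature)  # 21.7
```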
If you want to clean up all created assets, please follow this sample notebook.
You successfully completed this notebook!
You learned how to deploy and score a scikit-learn model that uses a custom transformer with the Watson Machine Learning service.
Check out our Online Documentation for more samples, tutorials, documentation, how-tos, and blog posts.
Krishnamurthy Arthanarisamy is a senior technical lead on the IBM Watson Machine Learning team. Krishna works on developing cloud services that cater to different stages of the machine learning and deep learning model lifecycle.
Lukasz Cmielowski, PhD, is a Software Architect and Data Scientist at IBM.
Copyright © 2020, 2021, 2022 IBM. This notebook and its source code are released under the terms of the MIT License.