This notebook contains the steps and code to demonstrate support of prompt tuning in watsonx.
Some familiarity with Python is helpful. This notebook uses Python 3.10.
The goal of this notebook is to demonstrate how to prompt-tune a foundation model on a classification task, deploy the tuned model, and compare its accuracy with the base model.
Before you use the sample code in this notebook, you must have a watsonx.ai project and an IBM Cloud API key.
Install and import the datasets and dependencies.
!pip install ibm-watsonx-ai==1.0.335 | tail -n 1
!pip install scikit-learn | tail -n 1
!pip install matplotlib | tail -n 1
!pip install wget | tail -n 1
This cell defines the credentials required to work with watsonx API for Foundation Model inferencing.
Action: Provide the IBM Cloud user API key. For details, see documentation.
import getpass
credentials = {
"url": "https://us-south.ml.cloud.ibm.com",
"apikey": getpass.getpass("Please enter your WML api key (hit enter): ")
}
The Foundation Model requires a project id that provides the context for the call. We will obtain the id from the project in which this notebook runs; otherwise, please provide the project id.
import os
try:
project_id = os.environ["PROJECT_ID"]
except KeyError:
project_id = input("Please enter your project_id (hit enter): ")
Create an instance of APIClient with authentication details.
from ibm_watsonx_ai import APIClient
client = APIClient(credentials)
To interact with all resources available in Watson Machine Learning, you need to set the project_id that you will be using.
client.set.default_project(project_id)
'SUCCESS'
This example uses the Consumer Financial Protection Bureau training dataset.
filename = 'cfpb_train.json'
Download training data from git repository and create data assets.
import wget
import os
url = "https://raw.github.com/IBM/watson-machine-learning-samples/master/cloud/data/prompt_tuning/cfpb_train.json"
if not os.path.isfile(filename):
wget.download(url)
asset_details = client.data_assets.create(name=filename, file_path=filename)
Creating data asset... SUCCESS
asset_id = client.data_assets.get_id(asset_details)
Define connection information to training data.
from ibm_watsonx_ai.helpers import DataConnection
data_conn = DataConnection(data_asset_id=asset_id)
from ibm_watsonx_ai.experiment import TuneExperiment
experiment = TuneExperiment(credentials, project_id=project_id)
All available tasks are presented under the Tasks enum.
{task.name: task.value for task in experiment.Tasks}
{'QUESTION_ANSWERING': 'question_answering', 'SUMMARIZATION': 'summarization', 'RETRIEVAL_AUGMENTED_GENERATION': 'retrieval_augmented_generation', 'CLASSIFICATION': 'classification', 'GENERATION': 'generation', 'CODE_GENERATION_AND_CONVERSION': 'code', 'EXTRACTION': 'extraction'}
Define the prompt_tuner parameters.
prompt_tuner = experiment.prompt_tuner(name="sample SDK run auto_update True",
task_id=experiment.Tasks.CLASSIFICATION,
base_model='google/flan-t5-xl',
accumulate_steps=32,
batch_size=16,
learning_rate=0.2,
max_input_tokens=256,
max_output_tokens=20,
num_epochs=6,
tuning_type=experiment.PromptTuningTypes.PT,
verbalizer="Including narratives choice the best match product with the items from the list: 'credit_card', 'debt_collection', 'mortgages_and_loans', 'credit_reporting', 'retail_banking'. Input: {{input}} Output: ",
auto_update_model=True
)
You can review the previously set parameters.
prompt_tuner.get_params()
{'base_model': {'model_id': 'google/flan-t5-xl'}, 'accumulate_steps': 32, 'batch_size': 16, 'learning_rate': 0.2, 'max_input_tokens': 256, 'max_output_tokens': 20, 'num_epochs': 6, 'task_id': 'classification', 'tuning_type': 'prompt_tuning', 'verbalizer': "Including narratives choice the best match product with the items from the list: 'credit_card', 'debt_collection', 'mortgages_and_loans', 'credit_reporting', 'retail_banking'. Input: {{input}} Output: ", 'name': 'sample SDK run auto_update True', 'description': 'Prompt tuning with SDK', 'auto_update_model': True, 'group_by_name': False}
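Before starting a long-running tuning job, it can be worth sanity-checking the returned parameters. The helper below is an illustrative sketch, not part of the ibm-watsonx-ai SDK, and the value ranges it checks are assumptions for this sample rather than limits enforced by the service.

```python
# Illustrative sanity check for the dict returned by prompt_tuner.get_params().
# The ranges below are assumptions for this sample, not SDK-enforced limits.
def check_tuning_params(params):
    """Return a list of human-readable warnings for suspicious values."""
    warnings = []
    if not 0 < params.get("learning_rate", 0) <= 1:
        warnings.append("learning_rate should typically be in (0, 1]")
    if params.get("batch_size", 0) < 1:
        warnings.append("batch_size must be at least 1")
    if params.get("num_epochs", 0) < 1:
        warnings.append("num_epochs must be at least 1")
    if params.get("max_output_tokens", 0) > params.get("max_input_tokens", 0):
        # For classification the expected output is a short label,
        # so this is only a heuristic.
        warnings.append("max_output_tokens unusually large relative to max_input_tokens")
    return warnings

sample = {"learning_rate": 0.2, "batch_size": 16, "num_epochs": 6,
          "max_input_tokens": 256, "max_output_tokens": 20}
print(check_tuning_params(sample))  # → []
```

With the parameters used in this notebook the check returns an empty list.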
Run a prompt tuning process of the foundation model on the training data referenced by DataConnection (tuning may take some time). By changing the background_mode parameter to True, the prompt tuning process will run in the background.
tuning_details = prompt_tuner.run(training_data_references=[data_conn], background_mode=False)
############################################## Running 'b4300476-f8dd-4684-81ec-290c15d1ed95' ############################################## pending........ running..................................................................................... completed Training of 'b4300476-f8dd-4684-81ec-290c15d1ed95' finished successfully.
Check the status/state of the initialized prompt tuning run if it was started in background mode, or after the process finishes if background mode is off.
prompt_tuner.get_run_status()
'completed'
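If you start the run with background_mode=True, you need to poll the status yourself before using the tuned model. The polling helper below is a minimal sketch: the terminal state names and the interval/timeout values are assumptions for this sample, and `get_status` stands in for the notebook's `prompt_tuner.get_run_status`.

```python
import time

# Minimal polling sketch for a tuning run started with background_mode=True.
# Terminal states and the polling interval are assumptions for this sample.
def wait_for_completion(get_status, interval=30.0, timeout=3600.0,
                        terminal_states=("completed", "failed", "canceled")):
    """Poll get_status() until it returns a terminal state or the timeout expires."""
    deadline = time.monotonic() + timeout
    while time.monotonic() < deadline:
        state = get_status()
        if state in terminal_states:
            return state
        time.sleep(interval)
    raise TimeoutError("tuning run did not finish within the timeout")

# In the notebook you would start the run in the background and then wait:
#   prompt_tuner.run(training_data_references=[data_conn], background_mode=True)
#   wait_for_completion(prompt_tuner.get_run_status)
```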
Get prompt tuning run details.
prompt_tuner.get_run_details()
{'metadata': {'created_at': '2023-12-06T14:31:27.126Z', 'description': 'Prompt tuning with SDK', 'id': 'b4300476-f8dd-4684-81ec-290c15d1ed95', 'modified_at': '2023-12-06T14:41:17.834Z', 'name': 'sample SDK run auto_update True', 'project_id': '70b1b2eb-b820-41ee-bcfb-76d8d83ee5c0', 'tags': ['prompt_tuning', 'wx_prompt_tune.2e31c747-cb30-49ce-9cff-ccad973ad9d2']}, 'entity': {'auto_update_model': True, 'description': 'Prompt tuning with SDK', 'model_id': 'a0613c34-faa5-49c0-86b5-9d3357293ce1', 'name': 'sample SDK run auto_update True', 'project_id': '70b1b2eb-b820-41ee-bcfb-76d8d83ee5c0', 'prompt_tuning': {'accumulate_steps': 32, 'base_model': {'model_id': 'google/flan-t5-xl'}, 'batch_size': 16, 'init_method': 'random', 'learning_rate': 0.2, 'max_input_tokens': 256, 'max_output_tokens': 20, 'num_epochs': 6, 'num_virtual_tokens': 100, 'task_id': 'classification', 'tuning_type': 'prompt_tuning', 'verbalizer': "Including narratives choice the best match product with the items from the list: 'credit_card', 'debt_collection', 'mortgages_and_loans', 'credit_reporting', 'retail_banking'. 
Input: {{input}} Output: "}, 'results_reference': {'connection': {}, 'location': {'path': 'default_tuning_output', 'training': 'default_tuning_output/b4300476-f8dd-4684-81ec-290c15d1ed95', 'training_status': 'default_tuning_output/b4300476-f8dd-4684-81ec-290c15d1ed95/training-status.json', 'model_request_path': 'default_tuning_output/b4300476-f8dd-4684-81ec-290c15d1ed95/assets/b4300476-f8dd-4684-81ec-290c15d1ed95/resources/wml_model/request.json', 'assets_path': 'default_tuning_output/b4300476-f8dd-4684-81ec-290c15d1ed95/assets'}, 'type': 'container'}, 'status': {'completed_at': '2023-12-06T14:41:17.672Z', 'state': 'completed'}, 'tags': ['prompt_tuning', 'wx_prompt_tune.2e31c747-cb30-49ce-9cff-ccad973ad9d2'], 'training_data_references': [{'connection': {}, 'location': {'href': '/v2/assets/606d9ab5-4672-4807-83f0-33615279392d', 'id': '606d9ab5-4672-4807-83f0-33615279392d'}, 'type': 'data_asset'}]}}
Let's summarize the run.
prompt_tuner.summary()
Model Name | Enhancements | Base model | Auto store | Epochs | loss
---|---|---|---|---|---
model_b4300476-f8dd-4684-81ec-290c15d1ed95 | [prompt_tuning] | google/flan-t5-xl | True | 6 | 0.356224
Plot learning curves.
prompt_tuner.plot_learning_curve()
You can retrieve the model_id from the tuning details.
model_id = None
if 'model_id' in tuning_details.get('entity', {}):
model_id = tuning_details['entity']['model_id']
model_id
'a0613c34-faa5-49c0-86b5-9d3357293ce1'
Create online deployment for published model.
from datetime import datetime
meta_props = {
client.deployments.ConfigurationMetaNames.NAME: "PT DEPLOYMENT SDK - project",
client.deployments.ConfigurationMetaNames.ONLINE: {},
client.deployments.ConfigurationMetaNames.SERVING_NAME : f"pt_sdk_deployment_{datetime.utcnow().strftime('%Y_%m_%d_%H%M%S')}"
}
deployment_details = client.deployments.create(model_id, meta_props)
####################################################################################### Synchronous deployment creation for uid: 'a0613c34-faa5-49c0-86b5-9d3357293ce1' started ####################################################################################### initializing ready ------------------------------------------------------------------------------------------------ Successfully finished deployment creation, deployment_uid='5217e49f-3c61-4f06-ac67-ca1b2de4bdf2' ------------------------------------------------------------------------------------------------
Additionally, you can get the deployment details by printing deployment_details.
deployment_details
You can retrieve the deployment_id from the deployment details.
deployment_id = deployment_details['metadata']['id']
deployment_id
'5217e49f-3c61-4f06-ac67-ca1b2de4bdf2'
Provide a set of model parameters for inferencing with watsonx.ai.
from ibm_watsonx_ai.metanames import GenTextParamsMetaNames as GenParams
generate_params = {
GenParams.MAX_NEW_TOKENS: 20,
GenParams.STOP_SEQUENCES: ["\n"]
}
Initialize the ModelInference class.
from ibm_watsonx_ai.foundation_models import ModelInference
tuned_model = ModelInference(
deployment_id=deployment_id,
params=generate_params,
api_client=client
)
Alternatively, you can use credentials and project_id to initialize the ModelInference class.
tuned_model = ModelInference(
deployment_id=deployment_id,
params=generate_params,
credentials=credentials,
project_id=project_id
)
Get deployment model inference details.
tuned_model.get_details()
Analyze the product class for a sample prompt.
response = tuned_model.generate_text(prompt="Including narratives choice the best match product with the items from the list: 'credit_card', 'debt_collection', 'mortgages_and_loans', 'credit_reporting', 'retail_banking'.\nComment: hi landed job reside ca needed room rent found place rent paid deposit dollar however position going didnt work longer needed rent place bay asked landlord refund security deposit refused told called back wellsfargo disputed transaction recently noticed card reversal checking account got charged amount dollar called bank werent able refund money also emailed landlord asking refund money ten day passed still response hope cfpb take action successfully resolve issue thank\nProduct:\n")
response
'credit_card'
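Prompts for the tuned deployment follow the shape of the sample above: the label list, the complaint narrative after "Comment:", and a trailing "Product:". A small helper (an illustrative assumption, not part of the ibm-watsonx-ai SDK) can build such prompts from raw narratives:

```python
# Illustrative helper (not part of the SDK) that builds a classification
# prompt in the same shape as the sample prompt above.
LABELS = ("'credit_card', 'debt_collection', 'mortgages_and_loans', "
          "'credit_reporting', 'retail_banking'")

def build_prompt(narrative):
    return (f"Including narratives choice the best match product with the "
            f"items from the list: {LABELS}.\nComment: {narrative}\nProduct:\n")

prompt = build_prompt("card was charged twice for the same purchase")
```

The resulting string can be passed directly to `tuned_model.generate_text(prompt=...)`.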
Download and prepare the cfpb_test dataset.
import pandas as pd
filename = 'cfpb_test.json'
url = "https://raw.github.com/IBM/watson-machine-learning-samples/master/cloud/data/prompt_tuning/cfpb_test.json"
if not os.path.isfile(filename):
wget.download(url)
data = pd.read_json(filename)
prompts = list(data.input)
products = list(data.output)
prompts_batch = list(prompts)  # each prompt is already a complete input string
tuned_model_results = tuned_model.generate_text(prompt=prompts_batch)
from sklearn.metrics import accuracy_score
print(f'accuracy_score: {accuracy_score(products, tuned_model_results)}')
accuracy_score: 0.6266666666666667
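Overall accuracy can hide classes the model handles poorly. As an optional extra step (an assumption, not part of the notebook's original evaluation), a per-class breakdown is easy to compute without any additional dependencies:

```python
from collections import Counter

# Illustrative per-class accuracy breakdown; overall accuracy can hide
# classes that the tuned model predicts poorly.
def per_class_accuracy(y_true, y_pred):
    correct, total = Counter(), Counter()
    for t, p in zip(y_true, y_pred):
        total[t] += 1
        if t == p:
            correct[t] += 1
    return {label: correct[label] / total[label] for label in total}

print(per_class_accuracy(["a", "a", "b"], ["a", "b", "b"]))  # → {'a': 0.5, 'b': 1.0}
```

In the notebook you would call `per_class_accuracy(products, tuned_model_results)`.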
Initialize the ModelInference class with the base model.
base_model = ModelInference(
model_id='google/flan-t5-xl',
params=generate_params,
api_client=client
)
base_model_results = base_model.generate_text(prompt=prompts_batch)
from sklearn.metrics import accuracy_score
print(f'base model accuracy_score: {accuracy_score(products, base_model_results)}')
base model accuracy_score: 0.5333333333333333
You successfully completed this notebook!
You learned how to use prompt tuning in watsonx to analyze product classes for sample prompts.
Check out our Online Documentation for more samples, tutorials, documentation, how-tos, and blog posts.
Mateusz Szewczyk, Software Engineer at Watson Machine Learning.
Copyright © 2023 IBM. This notebook and its source code are released under the terms of the MIT License.