Use watsonx Granite Model Series, Chroma, and LangChain to answer questions (RAG)¶
Disclaimers¶
- Use only Projects and Spaces that are available in watsonx context.
Notebook content¶
This notebook contains the steps and code to demonstrate support for Retrieval Augmented Generation in watsonx.ai. It introduces commands for data retrieval, knowledge base building and querying, and model testing.
Some familiarity with Python is helpful. This notebook uses Python 3.11.
About Retrieval Augmented Generation¶
Retrieval Augmented Generation (RAG) is a versatile pattern that can unlock a number of use cases requiring factual recall of information, such as querying a knowledge base in natural language.
In its simplest form, RAG requires 3 steps:
- Index knowledge base passages (once)
- Retrieve relevant passage(s) from knowledge base (for every user query)
- Generate a response by feeding retrieved passage into a large language model (for every user query)
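To make the pattern concrete before any libraries are introduced, here is a minimal, self-contained sketch of those three steps. The passages, the word-overlap scoring, and the prompt template are purely illustrative; the rest of this notebook implements the same flow with Chroma as the vector store and a Granite model on watsonx.ai as the generator.
# Minimal, library-free sketch of the three RAG steps (toy data and helper, for illustration only)
passages = [
    "The Eiffel Tower is located in Paris.",
    "The Colosseum is located in Rome.",
]

# 1. Index: here the "index" is just the list of passages kept in memory
# 2. Retrieve: score passages by word overlap with the query (a stand-in for vector similarity)
def retrieve(query, passages, k=1):
    overlap = lambda p: len(set(query.lower().split()) & set(p.lower().split()))
    return sorted(passages, key=overlap, reverse=True)[:k]

# 3. Generate: feed the retrieved context plus the question to a large language model
query = "Where is the Eiffel Tower?"
context = "\n".join(retrieve(query, passages))
prompt = f"Answer using the context.\n\nContext:\n{context}\n\nQuestion: {query}"
# response = llm(prompt)  # later in this notebook, a Granite model via WatsonxLLM plays this role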
Contents¶
This notebook contains the following parts:
- Set up the environment
- Build up knowledge base
- Foundation Models on watsonx.ai
- Generate a retrieval-augmented response to a question
- Summary and next steps
Set up the environment¶
Before you use the sample code in this notebook, you must perform the following setup tasks:
- Create a Watson Machine Learning (WML) Service instance (a free plan is offered and information about how to create the instance can be found here).
Install and import the dependencies¶
!pip install wget | tail -n 1
!pip install -U "langchain>=0.3,<0.4" | tail -n 1
!pip install -U "langchain_community>=0.3,<0.4" | tail -n 1
!pip install -U "ibm_watsonx_ai>=1.1.22" | tail -n 1
!pip install -U "langchain_ibm>=0.3,<0.4" | tail -n 1
!pip install -U "langchain_chroma>=0.1,<0.2" | tail -n 1
import os, getpass
watsonx API connection¶
This cell defines the credentials required to work with the watsonx API for Foundation Model inferencing.
Action: Provide the IBM Cloud user API key. For details, see documentation.
from ibm_watsonx_ai import Credentials

credentials = Credentials(
    url="https://us-south.ml.cloud.ibm.com",
    api_key=getpass.getpass("Please enter your WML api key (hit enter): "),
)
Defining the project id¶
The API requires a project id that provides the context for the call. We will try to obtain the id from the project in which this notebook runs; otherwise, please provide the project id explicitly.

Hint: You can find the project_id as follows. Open the Prompt Lab in watsonx.ai. At the very top of the UI there will be Projects / <project name> /. Click the <project name> link, then get the project_id from the project's Manage tab (Project -> Manage -> General -> Details).
try:
    project_id = os.environ["PROJECT_ID"]
except KeyError:
    project_id = input("Please enter your project_id (hit enter): ")
Create an instance of APIClient with authentication details.
from ibm_watsonx_ai import APIClient
api_client = APIClient(credentials=credentials, project_id=project_id)
import wget

# Download the sample document used as the knowledge base (the State of the Union address)
filename = 'state_of_the_union.txt'
url = 'https://raw.github.com/IBM/watson-machine-learning-samples/master/cloud/data/foundation_models/state_of_the_union.txt'

if not os.path.isfile(filename):
    wget.download(url, out=filename)
Build up knowledge base¶
The most common approach in RAG is to create dense vector representations of the knowledge base in order to calculate the semantic similarity to a given user query.
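As a brief illustration of what "semantic similarity" means here: both passages and queries are mapped to dense vectors, and relevance is typically scored with cosine similarity between those vectors. A minimal sketch with made-up vectors (the numbers are purely illustrative):
import numpy as np

# Toy embedding vectors (made-up numbers, for illustration only)
passage_vec = np.array([0.8, 0.1, 0.3])
query_vec = np.array([0.7, 0.2, 0.2])

# Cosine similarity: close to 1.0 means the vectors point in a similar direction
cosine = np.dot(passage_vec, query_vec) / (np.linalg.norm(passage_vec) * np.linalg.norm(query_vec))
print(f"cosine similarity: {cosine:.3f}")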
In this basic example, we take the State of the Union speech content (filename), split it into chunks, embed it using an open-source embedding model, load it into Chroma, and then query it.
from langchain_community.document_loaders import TextLoader
from langchain_text_splitters import CharacterTextSplitter
from langchain_chroma import Chroma
loader = TextLoader(filename)
documents = loader.load()
text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
texts = text_splitter.split_documents(documents)
The dataset we are using is already split into self-contained passages that can be ingested by Chroma.
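Optionally, inspect the resulting chunks before indexing them; this is just a sanity check, and the exact number of chunks depends on the splitter settings:
# Quick sanity check on the split documents
print(f"Number of chunks: {len(texts)}")
print(texts[0].page_content[:200])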
Create an embedding function¶
Note that you can feed a custom embedding function to be used by Chroma. The performance of the Chroma vector store may differ depending on the embedding model used. In the following example we use the watsonx.ai Embeddings service. The available embedding models can be listed with the EmbeddingModels enum:
api_client.foundation_models.EmbeddingModels.show()
{'SLATE_125M_ENGLISH_RTRVR': 'ibm/slate-125m-english-rtrvr', 'SLATE_125M_ENGLISH_RTRVR_V2': 'ibm/slate-125m-english-rtrvr-v2', 'SLATE_30M_ENGLISH_RTRVR': 'ibm/slate-30m-english-rtrvr', 'SLATE_30M_ENGLISH_RTRVR_V2': 'ibm/slate-30m-english-rtrvr-v2', 'MULTILINGUAL_E5_LARGE': 'intfloat/multilingual-e5-large', 'ALL_MINILM_L12_V2': 'sentence-transformers/all-minilm-l12-v2', 'ALL_MINILM_L6_V2': 'sentence-transformers/all-minilm-l6-v2'}
from langchain_ibm import WatsonxEmbeddings
embeddings = WatsonxEmbeddings(
    model_id="ibm/slate-30m-english-rtrvr",
    url=credentials.url,
    apikey=credentials.api_key,
    project_id=project_id
)
docsearch = Chroma.from_documents(texts, embeddings)
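Before wiring the vector store into a chain, you can optionally query it directly to verify that retrieval works; the query string below is just an example:
# Retrieve the most relevant chunks for a sample query directly from Chroma
sample_query = "What did the president say about Ketanji Brown Jackson"
for doc in docsearch.similarity_search(sample_query, k=2):
    print(doc.page_content[:150], "\n---")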
Compatibility of watsonx.ai Embeddings with LangChain¶
LangChain retrievers use embed_documents and embed_query under the hood to generate embedding vectors for the uploaded documents and the user query, respectively.
help(WatsonxEmbeddings)
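To see these methods in action, you can embed a sample query yourself and inspect the dimensionality of the returned vector (the query text is arbitrary):
# Embed a single query string and inspect the resulting vector
query_vector = embeddings.embed_query("Who was nominated to the Supreme Court?")
print(f"Vector length: {len(query_vector)}")
print(query_vector[:5])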
Foundation Models on watsonx.ai¶
IBM watsonx foundation models are among the LLMs supported by LangChain. This example shows how to communicate with the Granite Model Series using LangChain.
Defining the model¶
You need to specify the model_id that will be used for inferencing:
from ibm_watsonx_ai.foundation_models.utils.enums import ModelTypes
model_id = ModelTypes.GRANITE_13B_CHAT_V2
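If you want to see which other model_id values are available in your environment, the TextModels enum can be listed the same way as the embedding models above (assuming your ibm_watsonx_ai version exposes it):
# List the text generation models available to this API client
api_client.foundation_models.TextModels.show()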
Defining the model parameters¶
We need to provide a set of model parameters that will influence the result:
from ibm_watsonx_ai.metanames import GenTextParamsMetaNames as GenParams
from ibm_watsonx_ai.foundation_models.utils.enums import DecodingMethods
parameters = {
    GenParams.DECODING_METHOD: DecodingMethods.GREEDY,
    GenParams.MIN_NEW_TOKENS: 1,
    GenParams.MAX_NEW_TOKENS: 100,
    GenParams.STOP_SEQUENCES: ["<|endoftext|>"]
}
LangChain CustomLLM wrapper for watsonx model¶
Initialize the WatsonxLLM class from LangChain with the defined parameters and ibm/granite-13b-chat-v2.
from langchain_ibm import WatsonxLLM
watsonx_granite = WatsonxLLM(
    model_id=model_id.value,
    url=credentials.url,
    apikey=credentials.api_key,
    project_id=project_id,
    params=parameters
)
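As a quick check that the wrapper is configured correctly, you can invoke the model on its own before adding retrieval (the prompt is arbitrary):
# Call the Granite model directly, without any retrieved context
print(watsonx_granite.invoke("What is Retrieval Augmented Generation?"))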
Generate a retrieval-augmented response to a question¶
Build the RetrievalQA (question answering) chain to automate the RAG task.
from langchain.chains import RetrievalQA
qa = RetrievalQA.from_chain_type(llm=watsonx_granite, chain_type="stuff", retriever=docsearch.as_retriever())
Select questions¶
Define a sample question to ask about the loaded document.
query = "What did the president say about Ketanji Brown Jackson"
qa.invoke(query)
{'query': 'What did the president say about Ketanji Brown Jackson', 'result': ' The president said, "One of our nation’s top legal minds, who will continue Justice Breyer’s legacy of excellence." This statement was made in reference to Ketanji Brown Jackson, who was nominated by the president to serve on the United States Supreme Court.'}
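If you also want to see which passages the answer was grounded in, the chain can be rebuilt with return_source_documents=True; this is an optional variation, not required for the steps above:
# Rebuild the chain so the retrieved passages are returned alongside the answer
qa_with_sources = RetrievalQA.from_chain_type(
    llm=watsonx_granite,
    chain_type="stuff",
    retriever=docsearch.as_retriever(),
    return_source_documents=True
)
response = qa_with_sources.invoke(query)
print(response["result"])
print(len(response["source_documents"]), "source passages retrieved")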
Summary and next steps¶
You successfully completed this notebook!

You learned how to answer questions using RAG with watsonx.ai and LangChain.
Check out our Online Documentation for more samples, tutorials, documentation, how-tos, and blog posts.
Copyright © 2023, 2024 IBM. This notebook and its source code are released under the terms of the MIT License.