diff --git a/01_Generation/00_generate_w_bedrock.ipynb b/01_Generation/00_generate_w_bedrock.ipynb
index f0c182ce..c51f02bf 100644
--- a/01_Generation/00_generate_w_bedrock.ipynb
+++ b/01_Generation/00_generate_w_bedrock.ipynb
@@ -117,7 +117,7 @@
"source": [
"## Generate text\n",
"\n",
- "Following on the use case explained above, let's prepare an input for the Amazon Bedrock service to generate an email"
+ "Following on the use case explained above, let's prepare an input for the Amazon Bedrock service to generate an email. Note that this prompt would need to be modified with [Human:/Assistant: formatting for Claude.](https://docs.anthropic.com/claude/docs/human-and-assistant-formatting)"
]
},
{
@@ -181,8 +181,8 @@
"- `amazon.titan-tg1-large`\n",
"- `ai21.j2-grande-instruct`\n",
"- `ai21.j2-jumbo-instruct`\n",
- "- `anthropic.claude-instant-v1`\n",
- "- `anthropic.claude-v1`"
+ "- `anthropic.claude-instant-v2`\n",
+ "- `anthropic.claude-v2`"
]
},
{
diff --git a/01_Generation/01_zero_shot_generation.ipynb b/01_Generation/01_zero_shot_generation.ipynb
index c67ea8b7..58c7b835 100644
--- a/01_Generation/01_zero_shot_generation.ipynb
+++ b/01_Generation/01_zero_shot_generation.ipynb
@@ -126,8 +126,8 @@
"- amazon.titan-tg1-large\n",
"- ai21.j2-grande-instruct\n",
"- ai21.j2-jumbo-instruct\n",
- "- anthropic.claude-instant-v1\n",
- "- anthropic.claude-v1\n",
+ "- anthropic.claude-instant-v2\n",
+ "- anthropic.claude-v2\n",
"\n",
"Note that different models support different `model_kwargs`."
]
@@ -152,7 +152,7 @@
"}\n",
"\n",
"textgen_llm = Bedrock(\n",
- " model_id=\"anthropic.claude-v1\",\n",
+ " model_id=\"anthropic.claude-v2\",\n",
" client=boto3_bedrock,\n",
" model_kwargs=inference_modifier,\n",
")"
@@ -198,9 +198,13 @@
},
"outputs": [],
"source": [
- "response = textgen_llm(\"\"\"Write an email from Bob, Customer Service Manager, \n",
+ "response = textgen_llm(\"\"\"\n",
+ "\n",
+ "Human: Write an email from Bob, Customer Service Manager, \n",
"to the customer \"John Doe\" that provided negative feedback on the service \n",
- "provided by our customer support engineer.\\n\\nHuman:\"\"\")\n",
+ "provided by our customer support engineer.\n",
+ "\n",
+ "Assistant:\"\"\")\n",
"\n",
"print_ww(response)"
]
diff --git a/01_Generation/02_contextual_generation.ipynb b/01_Generation/02_contextual_generation.ipynb
index fc1a2a31..4aa94040 100644
--- a/01_Generation/02_contextual_generation.ipynb
+++ b/01_Generation/02_contextual_generation.ipynb
@@ -134,8 +134,8 @@
"- amazon.titan-tg1-large\n",
"- ai21.j2-grande-instruct\n",
"- ai21.j2-jumbo-instruct\n",
- "- anthropic.claude-instant-v1\n",
- "- anthropic.claude-v1\n",
+ "- anthropic.claude-instant-v2\n",
+ "- anthropic.claude-v2\n",
"\n",
"Note that different models support different `model_kwargs`."
]
@@ -158,7 +158,7 @@
" \"stop_sequences\": [\"\\n\\nHuman\"]\n",
" }\n",
"\n",
- "textgen_llm = Bedrock(model_id = \"anthropic.claude-v1\",\n",
+ "textgen_llm = Bedrock(model_id = \"anthropic.claude-v2\",\n",
" client = boto3_bedrock, \n",
" model_kwargs = inference_modifier \n",
" )\n"
@@ -190,9 +190,14 @@
"# Create a prompt template that has multiple input variables\n",
"multi_var_prompt = PromptTemplate(\n",
" input_variables=[\"customerServiceManager\", \"customerName\", \"feedbackFromCustomer\"], \n",
- " template=\"\"\"Create an apology email from the Service Manager {customerServiceManager} to {customerName}. \n",
- " in response to the following feedback that was received from the customer: {feedbackFromCustomer}.\n",
- " \"\"\"\n",
+ " template=\"\"\"\n",
+ "\n",
+ "Human: Create an apology email from the Service Manager {customerServiceManager} to {customerName} in response to the following feedback that was received from the customer: \n",
+ "\n",
+ "{feedbackFromCustomer}\n",
+ "\n",
+ "\n",
+ "Assistant:\"\"\"\n",
")\n",
"\n",
"# Pass in values to the input variables\n",
diff --git a/02_Summarization/01.small-text-summarization-claude.ipynb b/02_Summarization/01.small-text-summarization-claude.ipynb
index 72060d25..276e80ee 100644
--- a/02_Summarization/01.small-text-summarization-claude.ipynb
+++ b/02_Summarization/01.small-text-summarization-claude.ipynb
@@ -138,7 +138,7 @@
" \"top_p\":0.5,\n",
" \"stop_sequences\":[]\n",
" },\n",
- " modelId=\"anthropic.claude-v1\", \n",
+ " modelId=\"anthropic.claude-v2\", \n",
" accept=accept, \n",
" contentType=contentType)\n",
"\n",
@@ -161,8 +161,9 @@
"outputs": [],
"source": [
"prompt = \"\"\"\n",
- "Please provide a summary of the following text.\n",
"\n",
+ "Human: Please provide a summary of the following text.\n",
+ "\n",
"AWS took all of that feedback from customers, and today we are excited to announce Amazon Bedrock, \\\n",
"a new service that makes FMs from AI21 Labs, Anthropic, Stability AI, and Amazon accessible via an API. \\\n",
"Bedrock is the easiest way for customers to build and scale generative AI-based applications using FMs, \\\n",
@@ -173,8 +174,9 @@
"customize FMs with their own data, and easily integrate and deploy them into their applications using the AWS \\\n",
"tools and capabilities they are familiar with, without having to manage any infrastructure (including integrations \\\n",
"with Amazon SageMaker ML features like Experiments to test different models and Pipelines to manage their FMs at scale).\n",
+ "\n",
"\n",
- "\"\"\""
+ "Assistant:\"\"\""
]
},
{
@@ -224,7 +226,7 @@
},
"outputs": [],
"source": [
- "modelId = 'anthropic.claude-v1' # change this to use a different version from the model provider\n",
+ "modelId = 'anthropic.claude-v2' # change this to use a different version from the model provider\n",
"accept = 'application/json'\n",
"contentType = 'application/json'\n",
"\n",
diff --git a/03_QuestionAnswering/01_qa_w_rag_claude.ipynb b/03_QuestionAnswering/01_qa_w_rag_claude.ipynb
index 4cba18b3..e25938d0 100644
--- a/03_QuestionAnswering/01_qa_w_rag_claude.ipynb
+++ b/03_QuestionAnswering/01_qa_w_rag_claude.ipynb
@@ -175,7 +175,7 @@
"- `ai21.j2-grande-instruct`\n",
"- `ai21.j2-jumbo-instruct`\n",
"- `anthropic.claude-instant-v1`\n",
- "- `anthropic.claude-v1`\n",
+ "- `anthropic.claude-v2`"
"\n",
"Similarly for Embeddings:\n",
"\n",
@@ -195,7 +195,7 @@
"from langchain.llms.bedrock import Bedrock\n",
"\n",
"# - create the Anthropic Model\n",
- "llm = Bedrock(model_id=\"anthropic.claude-v1\", client=boto3_bedrock, model_kwargs={'max_tokens_to_sample':200})\n",
+ "llm = Bedrock(model_id=\"anthropic.claude-v2\", client=boto3_bedrock, model_kwargs={'max_tokens_to_sample':200})\n",
"bedrock_embeddings = BedrockEmbeddings(model_id=\"amazon.titan-embed-g1-text-02\", client=boto3_bedrock)"
]
},
@@ -412,7 +412,7 @@
"### Quick way\n",
"You have the possibility to use the wrapper provided by LangChain which wraps around the Vector Store and takes input the LLM.\n",
"This wrapper performs the following steps behind the scences:\n",
- "- Takes input the question\n",
+ "- Take the question as input\n",
"- Create question embedding\n",
"- Fetch relevant documents\n",
"- Stuff the documents and the question into a prompt\n",
@@ -468,7 +468,7 @@
"### Customisable option\n",
"In the above scenario you explored the quick and easy way to get a context-aware answer to your question. Now let's have a look at a more customizable option with the helpf of [RetrievalQA](https://python.langchain.com/en/latest/modules/chains/index_examples/vector_db_qa.html) where you can customize how the documents fetched should be added to prompt using `chain_type` parameter. Also, if you want to control how many relevant documents should be retrieved then change the `k` parameter in the cell below to see different outputs. In many scenarios you might want to know which were the source documents that the LLM used to generate the answer, you can get those documents in the output using `return_source_documents` which returns the documents that are added to the context of the LLM prompt. `RetrievalQA` also allows you to provide a custom [prompt template](https://python.langchain.com/en/latest/modules/prompts/prompt_templates/getting_started.html) which can be specific to the model.\n",
"\n",
- "Note: In this example we are using Anthropic Claude as the LLM under Amazon Bedrock, this particular model performs best if the inputs are provided under `Human:` and the model is requested to generate an output after `Assistant:`. In the cell below you see an example of how to control the prompt such that the LLM stays grounded and doesn't answer outside the context."
+ "Note: In this example we are using Anthropic Claude as the LLM under Amazon Bedrock. This particular model [performs best](https://docs.anthropic.com/claude/docs/human-and-assistant-formatting) if the inputs are provided under `Human:` and the model is requested to generate an output after `Assistant:`. In the cell below you see an example of how to control the prompt such that the LLM stays grounded and doesn't answer outside the context."
]
},
{
@@ -482,11 +482,15 @@
"from langchain.chains import RetrievalQA\n",
"from langchain.prompts import PromptTemplate\n",
"\n",
- "prompt_template = \"\"\"Human: Use the following pieces of context to provide a concise answer to the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer.\n",
+ "prompt_template = \"\"\"\n",
"\n",
+ "Human: Use the following pieces of context to provide a concise answer to the question at the end. If you don't know the answer, just say that you don't know, don't try to make up an answer.\n",
+ "\n",
"{context}\n",
+ "\n",
"{history}\n",
+ "\n",
"\n",
- "\n",
- "Human: {input}\n",
- "\n",
+ "Here is the human's next reply:\n",
+ "\n",
+ "{input}\n",
+ "\n",
"\n",
"Assistant:\n",
"\"\"\")\n",
@@ -556,7 +561,7 @@
"source": [
"### Interactive session using ipywidgets\n",
"\n",
- "The following utility class allows us to interact with Claude in a more natural way. We write out question in an input box, and get Claude answer. We can then continue our conversation."
+ "The following utility class allows us to interact with Claude in a more natural way. We write out the question in an input box, and get Claude's answer. We can then continue our conversation."
]
},
{
@@ -591,7 +596,7 @@
" else: \n",
" prompt = self.name.value\n",
" if 'q' == prompt or 'quit' == prompt or 'Q' == prompt:\n",
- " print(\"Thank you , that was a nice chat !!\")\n",
+ " print(\"Thank you , that was a nice chat!!\")\n",
" return\n",
" elif len(prompt) > 0:\n",
" with self.out:\n",
@@ -719,8 +724,8 @@
"# store previous interactions using ConversationalBufferMemory and add custom prompts to the chat.\n",
"memory = ConversationBufferMemory()\n",
"memory.chat_memory.add_user_message(\"You will be acting as a career coach. Your goal is to give career advice to users\")\n",
- "memory.chat_memory.add_ai_message(\"I am career coach and give career advice\")\n",
- "cl_llm = Bedrock(model_id=\"anthropic.claude-v1\",client=boto3_bedrock)\n",
+ "memory.chat_memory.add_ai_message(\"I am a career coach and give career advice\")\n",
+ "cl_llm = Bedrock(model_id=\"anthropic.claude-v2\",client=boto3_bedrock)\n",
"conversation = ConversationChain(\n",
" llm=cl_llm, verbose=True, memory=memory\n",
")\n",
@@ -809,7 +814,7 @@
"metadata": {},
"source": [
"## Chatbot with Context \n",
- "In this use case we will ask the Chatbot to answer question from some external corpus it has likely never seen before. To do this we apply a pattern called RAG (Retrieval Augmented Generation): the idea is to index the corpus in chunks, then lookup which sections of the corpus might be relevant to provide an answer by using semantic similarity between the chunks and the question. Finally the most relevant chunks are aggregated and passed as context to the ConversationChain, similar to providing an history.\n",
+ "In this use case we will ask the Chatbot to answer question from some external corpus it has likely never seen before. To do this we apply a pattern called RAG (Retrieval Augmented Generation): the idea is to index the corpus in chunks, then look up which sections of the corpus might be relevant to provide an answer by using semantic similarity between the chunks and the question. Finally the most relevant chunks are aggregated and passed as context to the ConversationChain, similar to providing a history.\n",
"\n",
"We will take a csv file and use **Titan Embeddings Model** to create vectors for each line of the csv. This vector is then stored in FAISS, an open source library providing an in-memory vector datastore. When the chatbot is asked a question, we query FAISS with the question and retrieve the text which is semantically closest. This will be our answer. "
]
@@ -1173,8 +1178,8 @@
"\n",
"Assistant: Question:\"\"\")\n",
"\n",
- "# recreate the Claude LLM with more tokens to sample - this provide longer responses but introduces some latency\n",
- "cl_llm = Bedrock(model_id=\"anthropic.claude-v1\", client=boto3_bedrock, model_kwargs={\"max_tokens_to_sample\": 500})\n",
+ "# recreate the Claude LLM with more tokens to sample - this provides longer responses but introduces some latency\n",
+ "cl_llm = Bedrock(model_id=\"anthropic.claude-v2\", client=boto3_bedrock, model_kwargs={\"max_tokens_to_sample\": 500})\n",
"memory_chain = ConversationBufferMemory(memory_key=\"chat_history\", return_messages=True)\n",
"qa = ConversationalRetrievalChain.from_llm(\n",
" llm=cl_llm, \n",
@@ -1192,7 +1197,6 @@
"qa.combine_docs_chain.llm_chain.prompt = PromptTemplate.from_template(\"\"\"\n",
"{context}\n",
"\n",
- "\n",
"Human: Use at maximum 3 sentences to answer the question inside the XML tags. \n",
"\n",
"{question}
\n",
diff --git a/06_CodeGeneration/00_code_generatation_w_bedrock.ipynb b/06_CodeGeneration/00_code_generatation_w_bedrock.ipynb
index 2a0cf1e6..eb9e25eb 100644
--- a/06_CodeGeneration/00_code_generatation_w_bedrock.ipynb
+++ b/06_CodeGeneration/00_code_generatation_w_bedrock.ipynb
@@ -213,6 +213,7 @@
"# Analyzing sales\n",
"\n",
"prompt_data = \"\"\"\n",
+ "\n",
"Human: You have a CSV, sales.csv, with columns:\n",
"- date (YYYY-MM-DD)\n",
"- product_id\n",
@@ -227,6 +228,7 @@
"- Visualize monthly sales using a bar chart\n",
"\n",
"Ensure the code is syntactically correct, bug-free, optimized, not span multiple lines unnessarily, and prefer to use standard libraries. Return only python code without any surrounding text, explanation or context.\n",
+ "\n",
"Assistant:\n",
"\"\"\""
]
diff --git a/06_CodeGeneration/01_sql_query_generate_w_bedrock.ipynb b/06_CodeGeneration/01_sql_query_generate_w_bedrock.ipynb
index 7edf9a99..0d9710fa 100644
--- a/06_CodeGeneration/01_sql_query_generate_w_bedrock.ipynb
+++ b/06_CodeGeneration/01_sql_query_generate_w_bedrock.ipynb
@@ -131,13 +131,14 @@
"source": [
"# create the prompt to generate SQL query\n",
"prompt_data = \"\"\"\n",
- "Command: Human: AnyCompany has a database with a table named sales_data containing sales records. The table has following columns:\n",
+ "\n",
+ "Human: AnyCompany has a database with a table named sales_data containing sales records. The table has following columns:\n",
"- date (YYYY-MM-DD)\n",
"- product_id\n",
"- price\n",
"- units_sold\n",
"\n",
- "Can you generate SQL queries for below: \n",
+ "Can you generate SQL queries for the below: \n",
"- Identify the top 5 best selling products by total sales for the year 2023\n",
"- Calculate the monthly average sales for the year 2023\n",
"\n",
@@ -227,7 +228,9 @@
"outputs": [],
"source": [
"# create the prompt\n",
- "prompt_sql_data = \"\"\"Command: You're provided with a database schema representing any hospital's patient management system.\n",
+ "prompt_sql_data = \"\"\"\n",
+ "\n",
+ "Human: You're provided with a database schema representing any hospital's patient management system.\n",
"The system holds records about patients, their prescriptions, doctors, and the medications prescribed.\n",
"\n",
"Here's the schema:\n",
diff --git a/06_CodeGeneration/02_code_interpret_w_langchain.ipynb b/06_CodeGeneration/02_code_interpret_w_langchain.ipynb
index 202353e1..5bf3b38b 100644
--- a/06_CodeGeneration/02_code_interpret_w_langchain.ipynb
+++ b/06_CodeGeneration/02_code_interpret_w_langchain.ipynb
@@ -130,8 +130,8 @@
"- amazon.titan-tg1-large\n",
"- ai21.j2-grande-instruct\n",
"- ai21.j2-jumbo-instruct\n",
- "- anthropic.claude-instant-v1\n",
- "- anthropic.claude-v1\n",
+ "- anthropic.claude-instant-v2\n",
+ "- anthropic.claude-v2\n",
"\n",
"Note that different models support different `model_kwargs`."
]
@@ -275,11 +275,15 @@
"# Create a prompt template that has multiple input variables\n",
"multi_var_prompt = PromptTemplate(\n",
" input_variables=[\"code\", \"programmingLanguage\"], \n",
- " template=\"\"\"Human: You will be acting as an expert software developer in {programmingLanguage}. \n",
- " You will explain below code and highlight if any red flags or not following best practices.\n",
- " {code}\n",
- " Assistant: \n",
- " \"\"\"\n",
+ " template=\"\"\"\n",
+ "\n",
+ "Human: You will be acting as an expert software developer in {programmingLanguage}. \n",
+ "You will explain the below code and highlight if there are any red flags or where best practices are not being followed.\n",
+ "\n",
+ "{code}\n",
+ "
\n",
+ "\n",
+ "Assistant:\"\"\"\n",
")\n",
"\n",
"# Pass in values to the input variables\n",
diff --git a/06_CodeGeneration/03_code_translate_w_langchain.ipynb b/06_CodeGeneration/03_code_translate_w_langchain.ipynb
index c8300e08..18f37d47 100644
--- a/06_CodeGeneration/03_code_translate_w_langchain.ipynb
+++ b/06_CodeGeneration/03_code_translate_w_langchain.ipynb
@@ -129,8 +129,8 @@
"- amazon.titan-tg1-large\n",
"- ai21.j2-grande-instruct\n",
"- ai21.j2-jumbo-instruct\n",
- "- anthropic.claude-instant-v1\n",
- "- anthropic.claude-v1\n",
+ "- anthropic.claude-instant-v2\n",
+ "- anthropic.claude-v2\n",
"\n",
"Note that different models support different `model_kwargs`."
]
@@ -274,11 +274,15 @@
"# Create a prompt template that has multiple input variables\n",
"multi_var_prompt = PromptTemplate(\n",
" input_variables=[\"code\", \"srcProgrammingLanguage\", \"targetProgrammingLanguage\"], \n",
- " template=\"\"\"Human: You will be acting as an expert software developer in {srcProgrammingLanguage} and {targetProgrammingLanguage}. \n",
- " You will tranlslate below code from {srcProgrammingLanguage} to {targetProgrammingLanguage} while following coding best practices.\n",
- " {code}\n",
- " Assistant: \n",
- " \"\"\"\n",
+ " template=\"\"\"\n",
+ "\n",
+ "Human: You will be acting as an expert software developer in {srcProgrammingLanguage} and {targetProgrammingLanguage}. \n",
+ "You will tranlslate below code from {srcProgrammingLanguage} to {targetProgrammingLanguage} while following coding best practices.\n",
+ "\n",
+ "{code}\n",
+ "
\n",
+ "\n",
+ "Assistant: \"\"\"\n",
")\n",
"\n",
"# Pass in values to the input variables\n",