Commit

Merge branch 'main' into main
wuloi authored Sep 25, 2024
2 parents e1fc8ba + c27923a commit 5fafc89
Showing 29 changed files with 1,007 additions and 864 deletions.
18 changes: 10 additions & 8 deletions README.md
@@ -40,17 +40,16 @@ in [LangChain.js](https://js.langchain.com/docs/ecosystem/langserve).

## ⚠️ LangGraph Compatibility

-LangServe is designed to primarily deploy simple Runnables and wok with well-known primitives in langchain-core.
+LangServe is designed to primarily deploy simple Runnables and work with well-known primitives in langchain-core.

If you need a deployment option for LangGraph, you should instead look at [LangGraph Cloud (beta)](https://langchain-ai.github.io/langgraph/cloud/), which is better suited for deploying LangGraph applications.

## Limitations

- Client callbacks are not yet supported for events that originate on the server
-- OpenAPI docs will not be generated when using Pydantic V2. Fast API does not
-  support [mixing pydantic v1 and v2 namespaces](https://github.com/tiangolo/fastapi/issues/10360).
-  See section below for more details.
+- Versions of LangServe <= 0.2.0 will not generate OpenAPI docs properly when using Pydantic V2, as FastAPI does not support [mixing pydantic v1 and v2 namespaces](https://github.com/tiangolo/fastapi/issues/10360).
+  See the section below for more details. Either upgrade to LangServe>=0.3.0 or downgrade to Pydantic v1 (see the version-pinning sketch below).
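
For example, either of the following resolves the issue (a minimal sketch; the exact pins are illustrative):

```sh
# Option 1: upgrade LangServe to a release that fully supports Pydantic 2
pip install "langserve>=0.3.0"

# Option 2: stay on LangServe <= 0.2.0 and pin Pydantic to v1
pip install "pydantic==1.10.17"
```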

## Security

@@ -208,8 +207,9 @@ app.add_middleware(

If you've deployed the server above, you can view the generated OpenAPI docs using:

-> ⚠️ If using pydantic v2, docs will not be generated for _invoke_, _batch_, _stream_,
+> ⚠️ If using LangServe <= 0.2.0 and pydantic v2, docs will not be generated for _invoke_, _batch_, _stream_,
> _stream_log_. See [Pydantic](#pydantic) section below for more details.
+> To resolve, please upgrade to LangServe 0.3.0.
```sh
curl localhost:8000/docs
```

@@ -380,7 +380,7 @@ prompt = ChatPromptTemplate.from_messages(
]
)

chain = prompt | ChatAnthropic(model="claude-2")
chain = prompt | ChatAnthropic(model="claude-2.1")


class InputChat(BaseModel):
@@ -472,7 +472,9 @@ gcloud run deploy [your-service-name] --source . --port 8001 --allow-unauthenticated

## Pydantic

-LangServe provides support for Pydantic 2 with some limitations.
+LangServe>=0.3 fully supports Pydantic 2.
+
+If you're using an earlier version of LangServe (<= 0.2), then please note that support for Pydantic 2 has the following limitations:

1. OpenAPI docs will not be generated for invoke/batch/stream/stream_log when using
   Pydantic V2, as FastAPI does not support [mixing pydantic v1 and v2 namespaces]. To fix this, use `pip install pydantic==1.10.17` (a quick version check follows below).
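
As a quick sanity check (a minimal sketch, assuming `pip` manages your environment), you can confirm which versions are installed before serving:

```sh
# Print the installed versions of langserve and pydantic
pip show langserve pydantic | grep -E "^(Name|Version):"
```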
@@ -772,7 +774,7 @@ prompt = ChatPromptTemplate.from_messages(
]
)

chain = prompt | ChatAnthropic(model="claude-2")
chain = prompt | ChatAnthropic(model="claude-2.1")


class MessageListInput(BaseModel):
2 changes: 1 addition & 1 deletion examples/chat_playground/legacy_input/server.py

@@ -28,7 +28,7 @@
]
)

chain = prompt | ChatAnthropic(model="claude-2")
chain = prompt | ChatAnthropic(model="claude-2.1")


class InputChat(BaseModel):
2 changes: 1 addition & 1 deletion examples/chat_with_persistence/server.py

@@ -76,7 +76,7 @@ def get_chat_history(session_id: str) -> FileChatMessageHistory:
]
)

chain = prompt | ChatAnthropic(model="claude-2")
chain = prompt | ChatAnthropic(model="claude-2.1")


class InputChat(BaseModel):
62 changes: 9 additions & 53 deletions examples/configurable_chain/client.ipynb

@@ -23,14 +23,7 @@
"tags": []
},
"outputs": [],
"source": [
"import requests\n",
"\n",
"inputs = {\"input\": {\"topic\": \"sports\"}}\n",
"response = requests.post(\"http://localhost:8000/configurable_temp/invoke\", json=inputs)\n",
"\n",
"response.json()"
]
"source": ["import requests\n\ninputs = {\"input\": {\"topic\": \"sports\"}}\nresponse = requests.post(\"http://localhost:8000/configurable_temp/invoke\", json=inputs)\n\nresponse.json()"]
},
{
"cell_type": "markdown",
@@ -46,11 +39,7 @@
"tags": []
},
"outputs": [],
"source": [
"from langserve import RemoteRunnable\n",
"\n",
"remote_runnable = RemoteRunnable(\"http://localhost:8000/configurable_temp\")"
]
"source": ["from langserve import RemoteRunnable\n\nremote_runnable = RemoteRunnable(\"http://localhost:8000/configurable_temp\")"]
},
{
"cell_type": "markdown",
@@ -66,9 +55,7 @@
"tags": []
},
"outputs": [],
"source": [
"response = await remote_runnable.ainvoke({\"topic\": \"sports\"})"
]
"source": ["response = await remote_runnable.ainvoke({\"topic\": \"sports\"})"]
},
{
"cell_type": "markdown",
@@ -84,11 +71,7 @@
"tags": []
},
"outputs": [],
"source": [
"from langchain.schema.runnable.config import RunnableConfig\n",
"\n",
"remote_runnable.batch([{\"topic\": \"sports\"}, {\"topic\": \"cars\"}])"
]
"source": ["from langchain_core.runnables import RunnableConfig\n\nremote_runnable.batch([{\"topic\": \"sports\"}, {\"topic\": \"cars\"}])"]
},
{
"cell_type": "markdown",
@@ -104,10 +87,7 @@
"tags": []
},
"outputs": [],
"source": [
"async for chunk in remote_runnable.astream({\"topic\": \"bears, but a bit verbose\"}):\n",
" print(chunk, end=\"\", flush=True)"
]
"source": ["async for chunk in remote_runnable.astream({\"topic\": \"bears, but a bit verbose\"}):\n print(chunk, end=\"\", flush=True)"]
},
{
"cell_type": "markdown",
@@ -157,14 +137,7 @@
"tags": []
},
"outputs": [],
"source": [
"await remote_runnable.ainvoke(\n",
" {\"topic\": \"sports\"},\n",
" config={\n",
" \"configurable\": {\"prompt\": \"how to say {topic} in french\", \"llm\": \"low_temp\"}\n",
" },\n",
")"
]
"source": ["await remote_runnable.ainvoke(\n {\"topic\": \"sports\"},\n config={\n \"configurable\": {\"prompt\": \"how to say {topic} in french\", \"llm\": \"low_temp\"}\n },\n)"]
},
{
"cell_type": "markdown",
@@ -221,13 +194,7 @@
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# The model will fail with an auth error\n",
"unauthenticated_response = requests.post(\n",
" \"http://localhost:8000/auth_from_header/invoke\", json={\"input\": \"hello\"}\n",
")\n",
"unauthenticated_response.json()"
]
"source": ["# The model will fail with an auth error\nunauthenticated_response = requests.post(\n \"http://localhost:8000/auth_from_header/invoke\", json={\"input\": \"hello\"}\n)\nunauthenticated_response.json()"]
},
{
"cell_type": "markdown",
@@ -244,25 +211,14 @@
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# The model will succeed as long as the above shell script is run previously\n",
"import os\n",
"\n",
"test_key = os.environ[\"TEST_API_KEY\"]\n",
"authenticated_response = requests.post(\n",
" \"http://localhost:8000/auth_from_header/invoke\",\n",
" json={\"input\": \"hello\"},\n",
" headers={\"x-api-key\": test_key},\n",
")\n",
"authenticated_response.json()"
]
"source": ["# The model will succeed as long as the above shell script is run previously\nimport os\n\ntest_key = os.environ[\"TEST_API_KEY\"]\nauthenticated_response = requests.post(\n \"http://localhost:8000/auth_from_header/invoke\",\n json={\"input\": \"hello\"},\n headers={\"x-api-key\": test_key},\n)\nauthenticated_response.json()"]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
"source": [""]
}
],
"metadata": {
94 changes: 13 additions & 81 deletions examples/llm/client.ipynb

@@ -16,9 +16,7 @@
"tags": []
},
"outputs": [],
"source": [
"from langchain.prompts.chat import ChatPromptTemplate"
]
"source": ["from langchain_core.prompts import ChatPromptTemplate"]
},
{
"cell_type": "code",
@@ -27,12 +25,7 @@
"tags": []
},
"outputs": [],
"source": [
"from langserve import RemoteRunnable\n",
"\n",
"openai_llm = RemoteRunnable(\"http://localhost:8000/openai/\")\n",
"anthropic = RemoteRunnable(\"http://localhost:8000/anthropic/\")"
]
"source": ["from langserve import RemoteRunnable\n\nopenai_llm = RemoteRunnable(\"http://localhost:8000/openai/\")\nanthropic = RemoteRunnable(\"http://localhost:8000/anthropic/\")"]
},
{
"cell_type": "markdown",
@@ -48,18 +41,7 @@
"tags": []
},
"outputs": [],
"source": [
"prompt = ChatPromptTemplate.from_messages(\n",
" [\n",
" (\n",
" \"system\",\n",
" \"You are a highly educated person who loves to use big words. \"\n",
" + \"You are also concise. Never answer in more than three sentences.\",\n",
" ),\n",
" (\"human\", \"Tell me about your favorite novel\"),\n",
" ]\n",
").format_messages()"
]
"source": ["prompt = ChatPromptTemplate.from_messages(\n [\n (\n \"system\",\n \"You are a highly educated person who loves to use big words. \"\n + \"You are also concise. Never answer in more than three sentences.\",\n ),\n (\"human\", \"Tell me about your favorite novel\"),\n ]\n).format_messages()"]
},
{
"cell_type": "markdown",
@@ -86,9 +68,7 @@
"output_type": "execute_result"
}
],
"source": [
"anthropic.invoke(prompt)"
]
"source": ["anthropic.invoke(prompt)"]
},
{
"cell_type": "code",
@@ -97,9 +77,7 @@
"tags": []
},
"outputs": [],
"source": [
"openai_llm.invoke(prompt)"
]
"source": ["openai_llm.invoke(prompt)"]
},
{
"cell_type": "markdown",
@@ -126,9 +104,7 @@
"output_type": "execute_result"
}
],
"source": [
"await openai_llm.ainvoke(prompt)"
]
"source": ["await openai_llm.ainvoke(prompt)"]
},
{
"cell_type": "code",
@@ -149,9 +125,7 @@
"output_type": "execute_result"
}
],
"source": [
"anthropic.batch([prompt, prompt])"
]
"source": ["anthropic.batch([prompt, prompt])"]
},
{
"cell_type": "code",
@@ -172,9 +146,7 @@
"output_type": "execute_result"
}
],
"source": [
"await anthropic.abatch([prompt, prompt])"
]
"source": ["await anthropic.abatch([prompt, prompt])"]
},
{
"cell_type": "markdown",
@@ -198,10 +170,7 @@
]
}
],
"source": [
"for chunk in anthropic.stream(prompt):\n",
" print(chunk.content, end=\"\", flush=True)"
]
"source": ["for chunk in anthropic.stream(prompt):\n print(chunk.content, end=\"\", flush=True)"]
},
{
"cell_type": "code",
@@ -218,19 +187,14 @@
]
}
],
"source": [
"async for chunk in anthropic.astream(prompt):\n",
" print(chunk.content, end=\"\", flush=True)"
]
"source": ["async for chunk in anthropic.astream(prompt):\n print(chunk.content, end=\"\", flush=True)"]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
"from langchain.schema.runnable import RunnablePassthrough"
]
"source": ["from langchain_core.runnables import RunnablePassthrough"]
},
{
"cell_type": "code",
@@ -239,37 +203,7 @@
"tags": []
},
"outputs": [],
"source": [
"comedian_chain = (\n",
" ChatPromptTemplate.from_messages(\n",
" [\n",
" (\n",
" \"system\",\n",
" \"You are a comedian that sometimes tells funny jokes and other times you just state facts that are not funny. Please either tell a joke or state fact now but only output one.\",\n",
" ),\n",
" ]\n",
" )\n",
" | openai_llm\n",
")\n",
"\n",
"joke_classifier_chain = (\n",
" ChatPromptTemplate.from_messages(\n",
" [\n",
" (\n",
" \"system\",\n",
" \"Please determine if the joke is funny. Say `funny` if it's funny and `not funny` if not funny. Then repeat the first five words of the joke for reference...\",\n",
" ),\n",
" (\"human\", \"{joke}\"),\n",
" ]\n",
" )\n",
" | anthropic\n",
")\n",
"\n",
"\n",
"chain = {\"joke\": comedian_chain} | RunnablePassthrough.assign(\n",
" classification=joke_classifier_chain\n",
")"
]
"source": ["comedian_chain = (\n ChatPromptTemplate.from_messages(\n [\n (\n \"system\",\n \"You are a comedian that sometimes tells funny jokes and other times you just state facts that are not funny. Please either tell a joke or state fact now but only output one.\",\n ),\n ]\n )\n | openai_llm\n)\n\njoke_classifier_chain = (\n ChatPromptTemplate.from_messages(\n [\n (\n \"system\",\n \"Please determine if the joke is funny. Say `funny` if it's funny and `not funny` if not funny. Then repeat the first five words of the joke for reference...\",\n ),\n (\"human\", \"{joke}\"),\n ]\n )\n | anthropic\n)\n\n\nchain = {\"joke\": comedian_chain} | RunnablePassthrough.assign(\n classification=joke_classifier_chain\n)"]
},
{
"cell_type": "code",
@@ -290,9 +224,7 @@
"output_type": "execute_result"
}
],
"source": [
"chain.invoke({})"
]
"source": ["chain.invoke({})"]
}
],
"metadata": {