Commit a791836

Merge remote-tracking branch 'origin/feat/deepinfra-llm-and-chat' into feat/deepinfra-llm-and-chat
ovuruska committed Jun 5, 2024
2 parents 98f34c5 + 4e2355f commit a791836
Showing 114 changed files with 3,292 additions and 1,129 deletions.
92 changes: 92 additions & 0 deletions .github/workflows/standard-tests.yml
@@ -0,0 +1,92 @@
name: Standard Tests (Integration)

on:
  workflow_dispatch:
  schedule:
    - cron: '0 13 * * *'

jobs:
  standard-tests:
    runs-on: ubuntu-latest
    strategy:
      matrix:
        package: [anthropic, cohere, google-genai, groq, mistralai]
    steps:
      - uses: actions/checkout@v4
      - name: Use Node.js 18.x
        uses: actions/setup-node@v3
        with:
          node-version: 18.x
          cache: "yarn"
      - name: Install dependencies
        run: yarn install --immutable --mode=skip-build
      - name: Run standard tests (integration) for ${{ matrix.package }}
        run: yarn test:standard:int --filter=@langchain/${{ matrix.package }}
        env:
          ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
          COHERE_API_KEY: ${{ secrets.COHERE_API_KEY }}
          GOOGLE_API_KEY: ${{ secrets.GOOGLE_API_KEY }}
          GROQ_API_KEY: ${{ secrets.GROQ_API_KEY }}
          MISTRAL_API_KEY: ${{ secrets.MISTRAL_API_KEY }}

  # The `@langchain/openai` package contains standard tests for both ChatOpenAI and AzureChatOpenAI.
  # We want to run these separately, so we pass the exact path of each test file,
  # which means each test needs its own job.
  standard-tests-openai:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Use Node.js 18.x
        uses: actions/setup-node@v3
        with:
          node-version: 18.x
          cache: "yarn"
      - name: Install dependencies
        run: yarn install --immutable --mode=skip-build
      - name: Build `@langchain/openai`
        run: yarn build --filter=@langchain/openai
      - name: Run standard tests (integration) for ChatOpenAI
        run: yarn workspace @langchain/openai test:single src/tests/chat_models.standard.int.test.ts
        env:
          OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}

  standard-tests-azure-openai:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Use Node.js 18.x
        uses: actions/setup-node@v3
        with:
          node-version: 18.x
          cache: "yarn"
      - name: Install dependencies
        run: yarn install --immutable --mode=skip-build
      - name: Build `@langchain/openai`
        run: yarn build --filter=@langchain/openai
      - name: Run standard tests (integration) for `@langchain/openai` AzureChatOpenAI
        run: yarn workspace @langchain/openai test:single src/tests/azure/chat_models.standard.int.test.ts
        env:
          AZURE_OPENAI_API_KEY: ${{ secrets.AZURE_OPENAI_API_KEY }}
          AZURE_OPENAI_API_DEPLOYMENT_NAME: "chat"
          AZURE_OPENAI_API_VERSION: ${{ secrets.AZURE_OPENAI_API_VERSION }}
          AZURE_OPENAI_BASE_PATH: ${{ secrets.AZURE_OPENAI_BASE_PATH }}

  standard-tests-bedrock:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Use Node.js 18.x
        uses: actions/setup-node@v3
        with:
          node-version: 18.x
          cache: "yarn"
      - name: Install dependencies
        run: yarn install --immutable --mode=skip-build
      - name: Build `@langchain/community`
        run: yarn build --filter=@langchain/community
      - name: Run standard tests (integration) for `@langchain/community` BedrockChat
        run: yarn workspace @langchain/community test:single src/chat_models/tests/chatbedrock.standard.int.test.ts
        env:
          BEDROCK_AWS_REGION: "us-east-1"
          BEDROCK_AWS_SECRET_ACCESS_KEY: ${{ secrets.BEDROCK_AWS_SECRET_ACCESS_KEY }}
          BEDROCK_AWS_ACCESS_KEY_ID: ${{ secrets.BEDROCK_AWS_ACCESS_KEY_ID }}
36 changes: 34 additions & 2 deletions docs/core_docs/docs/concepts.mdx
@@ -1,3 +1,34 @@
---
keywords:
[
prompt,
prompttemplate,
chatprompttemplate,
tool,
tools,
runnable,
runnables,
invoke,
vector,
vectorstore,
vectorstores,
embedding,
embeddings,
chat,
chat model,
llm,
llms,
retriever,
retrievers,
loader,
loaders,
document,
documents,
output,
output parser,
]
---

# Conceptual guide

This section contains introductions to key parts of LangChain.
@@ -641,8 +672,9 @@ LangChain provides several advanced retrieval types. A full list is below, along
| [Multi Vector](/docs/how_to/multi_vector/) | Vectorstore + Document Store | Sometimes during indexing | If you are able to extract information from documents that you think is more relevant to index than the text itself. | This involves creating multiple vectors for each document. Each vector could be created in a myriad of ways - examples include summaries of the text and hypothetical questions. |
| [Self Query](/docs/how_to/self_query/) | Vectorstore | Yes | If users are asking questions that are better answered by fetching documents based on metadata rather than similarity with the text. | This uses an LLM to transform user input into two things: (1) a string to look up semantically, (2) a metadata filter to go along with it. This is useful because oftentimes questions are about the METADATA of documents (not the content itself). |
| [Contextual Compression](/docs/how_to/contextual_compression/) | Any | Sometimes | If you are finding that your retrieved documents contain too much irrelevant information and are distracting the LLM. | This puts a post-processing step on top of another retriever and extracts only the most relevant information from retrieved documents. This can be done with embeddings or an LLM. |
| [Time-Weighted Vectorstore](/docs/how_to/time_weighted_vectorstore/) | Vectorstore | No | If you have timestamps associated with your documents, and you want to retrieve the most recent ones | This fetches documents based on a combination of semantic similarity (as in normal vector retrieval) and recency (looking at timestamps of indexed documents) |
| [Multi-Query Retriever](/docs/how_to/multiple_queries/) | Any | Yes | If users are asking questions that are complex and require multiple pieces of distinct information to respond | This uses an LLM to generate multiple queries from the original one. This is useful when the original query needs pieces of information about multiple topics to be properly answered. By generating multiple queries, we can then fetch documents for each of them. |
| [Time-Weighted Vectorstore](/docs/how_to/time_weighted_vectorstore/) | Vectorstore | No | If you have timestamps associated with your documents, and you want to retrieve the most recent ones. | This fetches documents based on a combination of semantic similarity (as in normal vector retrieval) and recency (looking at timestamps of indexed documents) |
| [Multi-Query Retriever](/docs/how_to/multiple_queries/) | Any | Yes | If users are asking questions that are complex and require multiple pieces of distinct information to respond. | This uses an LLM to generate multiple queries from the original one. This is useful when the original query needs pieces of information about multiple topics to be properly answered. By generating multiple queries, we can then fetch documents for each of them. |
| [Ensemble](/docs/how_to/ensemble_retriever) | Any | No | If you have multiple retrieval methods and want to try combining them. | This fetches documents from multiple retrievers and then combines them. |
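
To make the Multi-Query row above concrete, here is a minimal sketch; the `langchain/retrievers/multi_query` entrypoint, the `fromLLM` fields, and the model name are illustrative assumptions, not part of this diff:

```typescript
import { MemoryVectorStore } from "langchain/vectorstores/memory";
import { MultiQueryRetriever } from "langchain/retrievers/multi_query";
import { ChatOpenAI, OpenAIEmbeddings } from "@langchain/openai";

const vectorstore = await MemoryVectorStore.fromTexts(
  ["Mitochondria are the powerhouse of the cell"],
  [{ id: 1 }],
  new OpenAIEmbeddings()
);

// An LLM rewrites the user question into several variants, documents are
// fetched for each variant, and the de-duplicated union is returned.
const retriever = MultiQueryRetriever.fromLLM({
  llm: new ChatOpenAI({ model: "gpt-4o-mini" }), // assumed model name
  retriever: vectorstore.asRetriever(),
});

const docs = await retriever.invoke("What powers a cell?");
```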

### Text splitting

2 changes: 1 addition & 1 deletion docs/core_docs/docs/how_to/document_loader_html.ipynb
@@ -45,7 +45,7 @@
"1. Download & start the Docker container:\n",
" \n",
"```bash\n",
"docker run -p 8000:8000 -d --rm --name unstructured-api quay.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0\n",
"docker run -p 8000:8000 -d --rm --name unstructured-api downloads.unstructured.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0\n",
"```\n",
"\n",
"2. Get a free API key & API URL [here](https://unstructured.io/api-key), and set it in your environment (as per the Unstructured website, it may take up to an hour to allocate your API key & URL.):\n",
2 changes: 1 addition & 1 deletion docs/core_docs/docs/how_to/document_loader_markdown.ipynb
@@ -50,7 +50,7 @@
"1. Download & start the Docker container:\n",
" \n",
"```bash\n",
"docker run -p 8000:8000 -d --rm --name unstructured-api quay.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0\n",
"docker run -p 8000:8000 -d --rm --name unstructured-api downloads.unstructured.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0\n",
"```\n",
"\n",
"2. Get a free API key & API URL [here](https://unstructured.io/api-key), and set it in your environment (as per the Unstructured website, it may take up to an hour to allocate your API key & URL.):\n",
29 changes: 29 additions & 0 deletions docs/core_docs/docs/how_to/ensemble_retriever.mdx
@@ -0,0 +1,29 @@
# How to combine results from multiple retrievers

:::info Prerequisites

This guide assumes familiarity with the following concepts:

- [Documents](/docs/concepts#document)
- [Retrievers](/docs/concepts#retrievers)

:::

The [EnsembleRetriever](https://api.js.langchain.com/classes/langchain_retrievers_ensemble.EnsembleRetriever.html) supports ensembling of results from multiple retrievers. It is initialized with a list of [BaseRetriever](https://api.js.langchain.com/classes/langchain_core_retrievers.BaseRetriever.html) objects. EnsembleRetrievers rerank the results of the constituent retrievers based on the [Reciprocal Rank Fusion](https://plg.uwaterloo.ca/~gvcormac/cormacksigir09-rrf.pdf) algorithm.
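
For intuition, here is a minimal sketch of RRF scoring, not the library's internal implementation; the damping constant `k = 60` follows the linked paper's convention:

```typescript
// Each document's fused score is the sum, over retrievers, of 1 / (k + rank),
// where rank is its 1-based position in that retriever's result list.
function reciprocalRankFusion(
  resultLists: string[][], // document ids, best-first, one list per retriever
  k = 60
): string[] {
  const scores = new Map<string, number>();
  for (const results of resultLists) {
    results.forEach((id, i) => {
      scores.set(id, (scores.get(id) ?? 0) + 1 / (k + i + 1));
    });
  }
  // Highest fused score first
  return [...scores.entries()]
    .sort((a, b) => b[1] - a[1])
    .map(([id]) => id);
}
```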

By leveraging the strengths of different algorithms, the `EnsembleRetriever` can achieve better performance than any single algorithm.

One useful pattern is to combine a keyword matching retriever with a dense retriever (like embedding similarity), because their strengths are complementary. This can be considered a form of "hybrid search". The sparse retriever is good at finding relevant documents based on keywords, while the dense retriever is good at finding relevant documents based on semantic similarity.

Below we demonstrate ensembling a [simple custom retriever](/docs/how_to/custom_retriever/) that returns documents directly containing the input query with a retriever derived from a [demo in-memory vector store](https://api.js.langchain.com/classes/langchain_vectorstores_memory.MemoryVectorStore.html).

import CodeBlock from "@theme/CodeBlock";
import Example from "@examples/retrievers/ensemble_retriever.ts";

<CodeBlock language="typescript">{Example}</CodeBlock>
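
For a quick sense of the API shape, a minimal sketch (assuming the `langchain/retrievers/ensemble` entrypoint implied by the API link above; `weights` is an assumed optional field):

```typescript
import { MemoryVectorStore } from "langchain/vectorstores/memory";
import { EnsembleRetriever } from "langchain/retrievers/ensemble";
import { OpenAIEmbeddings } from "@langchain/openai";

const vectorStore = await MemoryVectorStore.fromTexts(
  ["Buildings are made out of brick", "Buildings are made out of wood"],
  [{ id: 1 }, { id: 2 }],
  new OpenAIEmbeddings()
);

// In practice you would pair a keyword retriever with a dense one;
// two vector-store retrievers keep this sketch self-contained.
const retriever = new EnsembleRetriever({
  retrievers: [vectorStore.asRetriever(1), vectorStore.asRetriever(2)],
  weights: [0.5, 0.5], // per-retriever weight applied to the RRF scores
});

const docs = await retriever.invoke("What are buildings made of?");
```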

## Next steps

You've now learned how to combine results from multiple retrievers.
Next, check out some other retrieval how-to guides, such as how to [improve results using multiple embeddings per document](/docs/how_to/multi_vector)
or how to [create your own custom retriever](/docs/how_to/custom_retriever).
1 change: 1 addition & 0 deletions docs/core_docs/docs/how_to/index.mdx
@@ -133,6 +133,7 @@ Retrievers are responsible for taking a query and returning relevant documents.
- [How to: generate multiple queries to retrieve data for](/docs/how_to/multiple_queries)
- [How to: use contextual compression to compress the data retrieved](/docs/how_to/contextual_compression)
- [How to: write a custom retriever class](/docs/how_to/custom_retriever)
- [How to: combine the results from multiple retrievers](/docs/how_to/ensemble_retriever)
- [How to: generate multiple embeddings per document](/docs/how_to/multi_vector)
- [How to: retrieve the whole document for a chunk](/docs/how_to/parent_document_retriever)
- [How to: generate metadata filters](/docs/how_to/self_query)
13 changes: 13 additions & 0 deletions docs/core_docs/docs/how_to/recursive_text_splitter.ipynb
@@ -1,5 +1,18 @@
{
  "cells": [
    {
      "cell_type": "raw",
      "metadata": {
        "vscode": {
          "languageId": "raw"
        }
      },
      "source": [
        "---\n",
        "keywords: [recursivecharactertextsplitter]\n",
        "---"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {},
8 changes: 6 additions & 2 deletions docs/core_docs/docs/how_to/sequence.ipynb
@@ -2,10 +2,14 @@
"cells": [
{
"cell_type": "raw",
"metadata": {},
"metadata": {
"vscode": {
"languageId": "raw"
}
},
"source": [
"---\n",
"keywords: [Runnable, Runnables, LCEL]\n",
"keywords: [chain, chaining, runnablesequence]\n",
"---"
]
},
13 changes: 13 additions & 0 deletions docs/core_docs/docs/how_to/tool_calling.ipynb
@@ -1,5 +1,18 @@
{
  "cells": [
    {
      "cell_type": "raw",
      "metadata": {
        "vscode": {
          "languageId": "raw"
        }
      },
      "source": [
        "---\n",
        "keywords: [function, function calling, tool, tool calling]\n",
        "---"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {},
2 changes: 1 addition & 1 deletion docs/core_docs/docs/integrations/chat/ollama_functions.mdx
@@ -19,7 +19,7 @@ Follow [these instructions](https://github.com/jmorganca/ollama) to set up and r
You can initialize this wrapper the same way you'd initialize a standard `ChatOllama` instance:

```typescript
import { OllamaFunctions } from "langchain/experimental/chat_models/ollama_functions";
import { OllamaFunctions } from "@langchain/community/experimental/chat_models/ollama_functions";

const model = new OllamaFunctions({
temperature: 0.1,
@@ -11,7 +11,7 @@ This example covers how to use Unstructured to load files of many types. Unstruc
You can run Unstructured locally on your computer using Docker. To do so, you need to have Docker installed. You can find the instructions to install Docker [here](https://docs.docker.com/get-docker/).

```bash
docker run -p 8000:8000 -d --rm --name unstructured-api quay.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0
docker run -p 8000:8000 -d --rm --name unstructured-api downloads.unstructured.io/unstructured-io/unstructured-api:latest --port 8000 --host 0.0.0.0
```

## Usage
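
As a minimal sketch of pointing the loader at the local container (the `@langchain/community` entrypoint, option names, and file path here are illustrative assumptions):

```typescript
import { UnstructuredLoader } from "@langchain/community/document_loaders/fs/unstructured";

const loader = new UnstructuredLoader("src/document_loaders/example_data/notion.md", {
  apiUrl: "http://localhost:8000/general/v0/general", // the container started above
  apiKey: process.env.UNSTRUCTURED_API_KEY, // only needed for the hosted API
});

const docs = await loader.load();
```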
4 changes: 4 additions & 0 deletions docs/core_docs/docs/integrations/platforms/aws.mdx
@@ -1,3 +1,7 @@
---
keywords: [bedrock]
---

# AWS

All functionality related to [Amazon AWS](https://aws.amazon.com/) platform
4 changes: 4 additions & 0 deletions docs/core_docs/docs/integrations/platforms/microsoft.mdx
@@ -1,3 +1,7 @@
---
keywords: [azure]
---

import CodeBlock from "@theme/CodeBlock";

# Microsoft
4 changes: 4 additions & 0 deletions docs/core_docs/docs/integrations/platforms/openai.mdx
@@ -1,3 +1,7 @@
---
keywords: [openai]
---

# OpenAI

All functionality related to OpenAI
4 changes: 4 additions & 0 deletions docs/core_docs/docs/integrations/text_embedding/openai.mdx
@@ -1,3 +1,7 @@
---
keywords: [openaiembeddings]
---

# OpenAI

The `OpenAIEmbeddings` class uses the OpenAI API to generate embeddings for a given text. By default it strips newline characters from the text, as recommended by OpenAI, but you can disable this by passing `stripNewLines: false` to the constructor.
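
For example, a minimal sketch of disabling that behavior:

```typescript
import { OpenAIEmbeddings } from "@langchain/openai";

// Keep newline characters in the input instead of the default stripping.
const embeddings = new OpenAIEmbeddings({ stripNewLines: false });

const vector = await embeddings.embedQuery("first line\nsecond line");
console.log(vector.length); // dimensionality of the returned embedding
```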
@@ -63,10 +63,10 @@ initial testing, you will want to use something like a
[GoogleCloudStorageDocstore](https://v02.api.js.langchain.com/classes/langchain_stores_doc_gcs.GoogleCloudStorageDocstore.html) to store it more permanently.

```typescript
import { MatchingEngine } from "langchain/vectorstores/googlevertexai";
import { MatchingEngine } from "@langchain/community/vectorstores/googlevertexai";
import { Document } from "langchain/document";
import { SyntheticEmbeddings } from "langchain/embeddings/fake";
import { GoogleCloudStorageDocstore } from "langchain/stores/doc/gcs";
import { GoogleCloudStorageDocstore } from "@langchain/community/stores/doc/gcs";

const embeddings = new SyntheticEmbeddings({
vectorSize: Number.parseInt(