forked from langchain-ai/langchainjs
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Adds metadata filtering for SemanticSimilarityExampleSelector, update…
…s docs (langchain-ai#2834) * Adds metadata filtering for SemanticSimilarityExampleSelector, updates docs * Update docs
- Loading branch information
1 parent
a672831
commit fa98f73
Showing
7 changed files
with
298 additions
and
62 deletions.
There are no files selected for viewing
28 changes: 28 additions & 0 deletions
28
docs/snippets/modules/model_io/prompts/example_selectors/similarity.mdx
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,4 +1,32 @@ | ||
import CodeBlock from "@theme/CodeBlock"; | ||
import ExampleSimilarity from "@examples/prompts/semantic_similarity_example_selector.ts"; | ||
|
||
The fields of the examples object will be used as parameters to format the `examplePrompt` passed to the `FewShotPromptTemplate`. | ||
Each example should therefore contain all required fields for the example prompt you are using. | ||
|
||
<CodeBlock language="typescript">{ExampleSimilarity}</CodeBlock> | ||
|
||
By default, each field in the examples object is concatenated together, embedded, and stored in the vectorstore for | ||
later similarity search against user queries. | ||
|
||
If you only want to embed specific keys | ||
(e.g., you only want to search for examples that have a similar query to the one the user provides), you can pass an `inputKeys` | ||
array in the final `options` parameter. | ||
|
||
## Loading from an existing vectorstore | ||
|
||
You can also use a pre-initialized vector store by passing an instance to the `SemanticSimilarityExampleSelector` constructor | ||
directly, as shown below. You can also add more examples via the `addExample` method: | ||
|
||
import ExampleSimilarityFromExisting from "@examples/prompts/semantic_similarity_example_selector_from_existing.ts"; | ||
|
||
<CodeBlock language="typescript">{ExampleSimilarityFromExisting}</CodeBlock> | ||
|
||
## Metadata filtering | ||
|
||
When adding examples, each field is available as metadata in the produced document. If you would like further control over your | ||
search space, you can add extra fields to your examples and pass a `filter` parameter when initializing your selector: | ||
|
||
import ExampleSimilarityMetadataFiltering from "@examples/prompts/semantic_similarity_example_selector_metadata_filtering.ts"; | ||
|
||
<CodeBlock language="typescript">{ExampleSimilarityMetadataFiltering}</CodeBlock> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
102 changes: 102 additions & 0 deletions
102
examples/src/prompts/semantic_similarity_example_selector_from_existing.ts
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,102 @@ | ||
// Ephemeral, in-memory vector store for demo purposes | ||
import { MemoryVectorStore } from "langchain/vectorstores/memory"; | ||
import { | ||
SemanticSimilarityExampleSelector, | ||
PromptTemplate, | ||
FewShotPromptTemplate, | ||
} from "langchain/prompts"; | ||
import { OpenAIEmbeddings } from "langchain/embeddings/openai"; | ||
import { ChatOpenAI } from "langchain/chat_models/openai"; | ||
|
||
const embeddings = new OpenAIEmbeddings(); | ||
|
||
const memoryVectorStore = new MemoryVectorStore(embeddings); | ||
|
||
const examples = [ | ||
{ | ||
query: "healthy food", | ||
output: `galbi`, | ||
}, | ||
{ | ||
query: "healthy food", | ||
output: `schnitzel`, | ||
}, | ||
{ | ||
query: "foo", | ||
output: `bar`, | ||
}, | ||
]; | ||
|
||
const exampleSelector = new SemanticSimilarityExampleSelector({ | ||
vectorStore: memoryVectorStore, | ||
k: 2, | ||
// Only embed the "query" key of each example | ||
inputKeys: ["query"], | ||
}); | ||
|
||
for (const example of examples) { | ||
// Format and add an example to the underlying vector store | ||
await exampleSelector.addExample(example); | ||
} | ||
|
||
// Create a prompt template that will be used to format the examples. | ||
const examplePrompt = PromptTemplate.fromTemplate(`<example> | ||
<user_input> | ||
{query} | ||
</user_input> | ||
<output> | ||
{output} | ||
</output> | ||
</example>`); | ||
|
||
// Create a FewShotPromptTemplate that will use the example selector. | ||
const dynamicPrompt = new FewShotPromptTemplate({ | ||
// We provide an ExampleSelector instead of examples. | ||
exampleSelector, | ||
examplePrompt, | ||
prefix: `Answer the user's question, using the below examples as reference:`, | ||
suffix: "User question: {query}", | ||
inputVariables: ["query"], | ||
}); | ||
|
||
const formattedValue = await dynamicPrompt.format({ | ||
query: "What is a healthy food?", | ||
}); | ||
console.log(formattedValue); | ||
|
||
/* | ||
Answer the user's question, using the below examples as reference: | ||
<example> | ||
<user_input> | ||
healthy | ||
</user_input> | ||
<output> | ||
galbi | ||
</output> | ||
</example> | ||
<example> | ||
<user_input> | ||
healthy | ||
</user_input> | ||
<output> | ||
schnitzel | ||
</output> | ||
</example> | ||
User question: What is a healthy food? | ||
*/ | ||
|
||
const model = new ChatOpenAI({}); | ||
|
||
const chain = dynamicPrompt.pipe(model); | ||
|
||
const result = await chain.invoke({ query: "What is a healthy food?" }); | ||
console.log(result); | ||
/* | ||
AIMessage { | ||
content: 'A healthy food can be galbi or schnitzel.', | ||
additional_kwargs: { function_call: undefined } | ||
} | ||
*/ |
82 changes: 82 additions & 0 deletions
82
examples/src/prompts/semantic_similarity_example_selector_metadata_filtering.ts
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,82 @@ | ||
// Ephemeral, in-memory vector store for demo purposes | ||
import { MemoryVectorStore } from "langchain/vectorstores/memory"; | ||
import { | ||
SemanticSimilarityExampleSelector, | ||
PromptTemplate, | ||
FewShotPromptTemplate, | ||
} from "langchain/prompts"; | ||
import { OpenAIEmbeddings } from "langchain/embeddings/openai"; | ||
import { ChatOpenAI } from "langchain/chat_models/openai"; | ||
import { Document } from "langchain/document"; | ||
|
||
const embeddings = new OpenAIEmbeddings(); | ||
|
||
const memoryVectorStore = new MemoryVectorStore(embeddings); | ||
|
||
const examples = [ | ||
{ | ||
query: "healthy food", | ||
output: `lettuce`, | ||
food_type: "vegetable", | ||
}, | ||
{ | ||
query: "healthy food", | ||
output: `schnitzel`, | ||
food_type: "veal", | ||
}, | ||
{ | ||
query: "foo", | ||
output: `bar`, | ||
food_type: "baz", | ||
}, | ||
]; | ||
|
||
const exampleSelector = new SemanticSimilarityExampleSelector({ | ||
vectorStore: memoryVectorStore, | ||
k: 2, | ||
// Only embed the "query" key of each example | ||
inputKeys: ["query"], | ||
// Filter type will depend on your specific vector store. | ||
// See the section of the docs for the specific vector store you are using. | ||
filter: (doc: Document) => doc.metadata.food_type === "vegetable", | ||
}); | ||
|
||
for (const example of examples) { | ||
// Format and add an example to the underlying vector store | ||
await exampleSelector.addExample(example); | ||
} | ||
|
||
// Create a prompt template that will be used to format the examples. | ||
const examplePrompt = PromptTemplate.fromTemplate(`<example> | ||
<user_input> | ||
{query} | ||
</user_input> | ||
<output> | ||
{output} | ||
</output> | ||
</example>`); | ||
|
||
// Create a FewShotPromptTemplate that will use the example selector. | ||
const dynamicPrompt = new FewShotPromptTemplate({ | ||
// We provide an ExampleSelector instead of examples. | ||
exampleSelector, | ||
examplePrompt, | ||
prefix: `Answer the user's question, using the below examples as reference:`, | ||
suffix: "User question:\n{query}", | ||
inputVariables: ["query"], | ||
}); | ||
|
||
const model = new ChatOpenAI({}); | ||
|
||
const chain = dynamicPrompt.pipe(model); | ||
|
||
const result = await chain.invoke({ | ||
query: "What is exactly one type of healthy food?", | ||
}); | ||
console.log(result); | ||
/* | ||
AIMessage { | ||
content: 'One type of healthy food is lettuce.', | ||
additional_kwargs: { function_call: undefined } | ||
} | ||
*/ |
Oops, something went wrong.