Adding CQA Retriever

This commit is contained in:
2025-05-24 12:27:45 -05:00
parent 65fb3532e3
commit 93362b209b
7 changed files with 240 additions and 0 deletions

View File

@@ -0,0 +1,74 @@
const filter = {
filterExpression: CQA_RetrieverSettings.filterExpression,
};
const embedding = new langchain.openai.AzureOpenAIEmbeddings({
azureOpenAIApiInstanceName:
CQA_RetrieverSettings.azure_openai_api.instance_name,
azureOpenAIApiDeploymentName:
CQA_RetrieverSettings.azure_openai_api.deployment_name,
azureOpenAIApiVersion: CQA_RetrieverSettings.azure_openai_api.version,
azureOpenAIApiKey: CQA_RetrieverSettings.azure_openai_api.key,
});
const store =
new langchain.community.vectorstores.azure_aisearch.AzureAISearchVectorStore(
embedding,
{
endpoint: CQA_RetrieverSettings.azure_aisearch.endpoint,
key: CQA_RetrieverSettings.azure_aisearch.key,
indexName: CQA_RetrieverSettings.azure_aisearch.index_name,
search: {
type: langchain.community.vectorstores.azure_aisearch
.AzureAISearchQueryType.SimilarityHybrid,
},
}
);
function getSourceId(document) {
if (document.metadata) {
const mergedMetadata = Object.values(document.metadata).join("");
const metatDataObj = JSON.parse(mergedMetadata);
if ("sourceURL" in metatDataObj) {
return metatDataObj.sourceURL;
}
if ("source" in metatDataObj) {
return metatDataObj.source;
}
if ("source_id" in metatDataObj) {
return metatDataObj.source_id;
}
if ("sourceName" in metatDataObj) {
return metatDataObj.sourceName;
}
} else return "no source found";
}
return {
async retrieve(query) {
const resultDocuments = await store.similaritySearch(query, 20, filter);
const sources = resultDocuments.map((doc) => ({
source_id: getSourceId(doc),
text: doc.pageContent,
}));
const cqaSources = {
instances: [
{
sources: sources,
question: query,
generate_question: true,
knowledgebase_description: "iva-vector-demo",
extra_guidance: "",
language_code: "en-GB",
},
],
};
if (CQA_RetrieverSettings.debug)
console.log(JSON.stringify(cqaSources, null, 2));
return cqaSources;
},
};

View File

@@ -0,0 +1,16 @@
{
"azure_aisearch": {
"endpoint": "https://iva-demo-vector-service.search.windows.net",
"key": "<azure_aisearch_key>",
"index_name": "iva-vector-demo"
},
"azure_openai_api": {
"key": "<azure_openai_key>",
"instance_name": "iva-open-ai",
"deployment_name": "text-embedding-3-small",
"embeddings_deployment_name": null,
"version": "2024-08-01-preview"
},
"filterExpression": "search.in(company, 'Verint')",
"debug": true
}