mirror of
https://git.mirrors.martin98.com/https://github.com/langgenius/dify.git
synced 2025-05-14 07:28:17 +08:00
123 lines
3.8 KiB
TypeScript
123 lines
3.8 KiB
TypeScript
import { uniq } from 'lodash-es'
|
|
import type { MultipleRetrievalConfig } from './types'
|
|
import type {
|
|
DataSet,
|
|
SelectedDatasetsMode,
|
|
} from '@/models/datasets'
|
|
import {
|
|
DEFAULT_WEIGHTED_SCORE,
|
|
RerankingModeEnum,
|
|
} from '@/models/datasets'
|
|
import { RETRIEVE_METHOD } from '@/types/app'
|
|
import { DATASET_DEFAULT } from '@/config'
|
|
|
|
export const checkNodeValid = () => {
|
|
return true
|
|
}
|
|
|
|
export const getSelectedDatasetsMode = (datasets: DataSet[]) => {
|
|
let allHighQuality = true
|
|
let allHighQualityVectorSearch = true
|
|
let allHighQualityFullTextSearch = true
|
|
let allEconomic = true
|
|
let mixtureHighQualityAndEconomic = true
|
|
let inconsistentEmbeddingModel = false
|
|
if (!datasets.length) {
|
|
allHighQuality = false
|
|
allHighQualityVectorSearch = false
|
|
allHighQualityFullTextSearch = false
|
|
allEconomic = false
|
|
mixtureHighQualityAndEconomic = false
|
|
inconsistentEmbeddingModel = false
|
|
}
|
|
datasets.forEach((dataset) => {
|
|
if (dataset.indexing_technique === 'economy') {
|
|
allHighQuality = false
|
|
allHighQualityVectorSearch = false
|
|
allHighQualityFullTextSearch = false
|
|
}
|
|
if (dataset.indexing_technique === 'high_quality') {
|
|
allEconomic = false
|
|
|
|
if (dataset.retrieval_model_dict.search_method !== RETRIEVE_METHOD.semantic)
|
|
allHighQualityVectorSearch = false
|
|
|
|
if (dataset.retrieval_model_dict.search_method !== RETRIEVE_METHOD.fullText)
|
|
allHighQualityFullTextSearch = false
|
|
}
|
|
})
|
|
|
|
if (allHighQuality || allEconomic)
|
|
mixtureHighQualityAndEconomic = false
|
|
|
|
if (allHighQuality)
|
|
inconsistentEmbeddingModel = uniq(datasets.map(item => item.embedding_model)).length > 1
|
|
|
|
return {
|
|
allHighQuality,
|
|
allHighQualityVectorSearch,
|
|
allHighQualityFullTextSearch,
|
|
allEconomic,
|
|
mixtureHighQualityAndEconomic,
|
|
inconsistentEmbeddingModel,
|
|
} as SelectedDatasetsMode
|
|
}
|
|
|
|
export const getMultipleRetrievalConfig = (multipleRetrievalConfig: MultipleRetrievalConfig, selectedDatasets: DataSet[]) => {
|
|
const {
|
|
allHighQuality,
|
|
allHighQualityVectorSearch,
|
|
allHighQualityFullTextSearch,
|
|
allEconomic,
|
|
mixtureHighQualityAndEconomic,
|
|
inconsistentEmbeddingModel,
|
|
} = getSelectedDatasetsMode(selectedDatasets)
|
|
|
|
const {
|
|
top_k = DATASET_DEFAULT.top_k,
|
|
score_threshold,
|
|
reranking_mode,
|
|
reranking_model,
|
|
weights,
|
|
reranking_enable,
|
|
} = multipleRetrievalConfig || { top_k: DATASET_DEFAULT.top_k }
|
|
|
|
const result = {
|
|
top_k,
|
|
score_threshold,
|
|
reranking_mode,
|
|
reranking_model,
|
|
weights,
|
|
reranking_enable: allEconomic ? reranking_enable : true,
|
|
}
|
|
|
|
if (allEconomic || mixtureHighQualityAndEconomic || inconsistentEmbeddingModel)
|
|
result.reranking_mode = RerankingModeEnum.RerankingModel
|
|
|
|
if (allHighQuality && !inconsistentEmbeddingModel && reranking_mode === undefined)
|
|
result.reranking_mode = RerankingModeEnum.WeightedScore
|
|
|
|
if (allHighQuality && !inconsistentEmbeddingModel && (reranking_mode === RerankingModeEnum.WeightedScore || reranking_mode === undefined) && !weights) {
|
|
result.weights = {
|
|
vector_setting: {
|
|
vector_weight: allHighQualityVectorSearch
|
|
? DEFAULT_WEIGHTED_SCORE.allHighQualityVectorSearch.semantic
|
|
: allHighQualityFullTextSearch
|
|
? DEFAULT_WEIGHTED_SCORE.allHighQualityFullTextSearch.semantic
|
|
: DEFAULT_WEIGHTED_SCORE.other.semantic,
|
|
embedding_provider_name: selectedDatasets[0].embedding_model_provider,
|
|
embedding_model_name: selectedDatasets[0].embedding_model,
|
|
},
|
|
keyword_setting: {
|
|
keyword_weight: allHighQualityVectorSearch
|
|
? DEFAULT_WEIGHTED_SCORE.allHighQualityVectorSearch.keyword
|
|
: allHighQualityFullTextSearch
|
|
? DEFAULT_WEIGHTED_SCORE.allHighQualityFullTextSearch.keyword
|
|
: DEFAULT_WEIGHTED_SCORE.other.keyword,
|
|
},
|
|
}
|
|
}
|
|
|
|
return result
|
|
}
|