dify/api/core/helper/position_helper.py

117 lines
4.7 KiB
Python

import os
from collections import OrderedDict
from collections.abc import Callable
from typing import Any
from configs import dify_config
from core.tools.utils.yaml_utils import load_yaml_file
def get_position_map(folder_path: str, *, file_name: str = "_position.yaml") -> dict[str, int]:
"""
Get the mapping from name to index from a YAML file.
:param folder_path:
:param file_name: the YAML file name, default to '_position.yaml'
:return: a dict with name as key and index as value
"""
position_file_path = os.path.join(folder_path, file_name)
yaml_content = load_yaml_file(file_path=position_file_path, default_value=[])
positions = [item.strip() for item in yaml_content if item and isinstance(item, str) and item.strip()]
return {name: index for index, name in enumerate(positions)}
def get_tool_position_map(folder_path: str, file_name: str = "_position.yaml") -> dict[str, int]:
"""
Get the mapping for tools from name to index from a YAML file.
:param folder_path:
:param file_name: the YAML file name, default to '_position.yaml'
:return: a dict with name as key and index as value
"""
position_map = get_position_map(folder_path, file_name=file_name)
return sort_and_filter_position_map(
position_map,
pin_list=dify_config.POSITION_TOOL_PINS_LIST,
include_list=dify_config.POSITION_TOOL_INCLUDES_LIST,
exclude_list=dify_config.POSITION_TOOL_EXCLUDES_LIST
)
def get_provider_position_map(folder_path: str, file_name: str = "_position.yaml") -> dict[str, int]:
"""
Get the mapping for providers from name to index from a YAML file.
:param folder_path:
:param file_name: the YAML file name, default to '_position.yaml'
:return: a dict with name as key and index as value
"""
position_map = get_position_map(folder_path, file_name=file_name)
return sort_and_filter_position_map(
position_map,
pin_list=dify_config.POSITION_PROVIDER_PINS_LIST,
include_list=dify_config.POSITION_PROVIDER_INCLUDES_LIST,
exclude_list=dify_config.POSITION_PROVIDER_EXCLUDES_LIST
)
def sort_and_filter_position_map(original_position_map: dict[str, int], pin_list: list[str], include_list: list[str], exclude_list: list[str]) -> dict[str, int]:
"""
Sort and filter the positions
:param position_map: the position map to be sorted and filtered
:param pin_list: the list of pins to be put at the beginning
:param include_set: the set of names to be included
:param exclude_set: the set of names to be excluded
:return: the sorted and filtered position map
"""
positions = sorted(original_position_map.keys(), key=lambda x: original_position_map[x])
include_set = set(include_list) if include_list else set(positions)
exclude_set = set(exclude_list) if exclude_list else set()
# Add pins to position map
position_map = {name: idx for idx, name in enumerate(pin_list) if name in original_position_map}
# Add remaining positions to position map, respecting include and exclude lists
start_idx = len(position_map)
for name in positions:
if name in include_set and name not in exclude_set and name not in position_map:
position_map[name] = start_idx
start_idx += 1
return position_map
def sort_by_position_map(
position_map: dict[str, int],
data: list[Any],
name_func: Callable[[Any], str],
) -> list[Any]:
"""
Sort the objects by the position map.
If the name of the object is not in the position map, it will be put at the end.
:param position_map: the map holding positions in the form of {name: index}
:param name_func: the function to get the name of the object
:param data: the data to be sorted
:return: the sorted objects
"""
if not position_map or not data:
return data
filtered_data = [item for item in data if name_func(item) in position_map]
return sorted(filtered_data, key=lambda x: position_map.get(name_func(x), float('inf')))
def sort_to_dict_by_position_map(
position_map: dict[str, int],
data: list[Any],
name_func: Callable[[Any], str],
) -> OrderedDict[str, Any]:
"""
Sort the objects into a ordered dict by the position map.
If the name of the object is not in the position map, it will be put at the end.
:param position_map: the map holding positions in the form of {name: index}
:param name_func: the function to get the name of the object
:param data: the data to be sorted
:return: an OrderedDict with the sorted pairs of name and object
"""
sorted_items = sort_by_position_map(position_map, data, name_func)
return OrderedDict([(name_func(item), item) for item in sorted_items])