| |
| |
| """ |
| Reference: |
| - [graphrag](https://github.com/microsoft/graphrag) |
| """ |
|
|
| import html |
| import re |
| from collections.abc import Callable |
| from typing import Any |
|
|
| ErrorHandlerFn = Callable[[BaseException | None, str | None, dict | None], None] |
|
|
|
|
| def perform_variable_replacements( |
| input: str, history: list[dict] | None = None, variables: dict | None = None |
| ) -> str: |
| """Perform variable replacements on the input string and in a chat log.""" |
| if history is None: |
| history = [] |
| if variables is None: |
| variables = {} |
| result = input |
|
|
| def replace_all(input: str) -> str: |
| result = input |
| for k, v in variables.items(): |
| result = result.replace(f"{{{k}}}", v) |
| return result |
|
|
| result = replace_all(result) |
| for i, entry in enumerate(history): |
| if entry.get("role") == "system": |
| entry["content"] = replace_all(entry.get("content") or "") |
|
|
| return result |
|
|
|
|
| def clean_str(input: Any) -> str: |
| """Clean an input string by removing HTML escapes, control characters, and other unwanted characters.""" |
| |
| if not isinstance(input, str): |
| return input |
|
|
| result = html.unescape(input.strip()) |
| |
| return re.sub(r"[\"\x00-\x1f\x7f-\x9f]", "", result) |
|
|
|
|
| def dict_has_keys_with_types( |
| data: dict, expected_fields: list[tuple[str, type]] |
| ) -> bool: |
| """Return True if the given dictionary has the given keys with the given types.""" |
| for field, field_type in expected_fields: |
| if field not in data: |
| return False |
|
|
| value = data[field] |
| if not isinstance(value, field_type): |
| return False |
| return True |
|
|
|
|