langflow/src/backend/base/langflow/schema/schema.py
2024-04-01 10:37:41 -03:00

150 lines
5.2 KiB
Python

import copy
from typing import Literal, Optional
from langchain_core.documents import Document
from pydantic import BaseModel, model_validator
class Record(BaseModel):
"""
Represents a record with text and optional data.
Attributes:
data (dict, optional): Additional data associated with the record.
"""
text_key: Optional[str] = "text"
data: dict = {}
default_value: Optional[str] = ""
@model_validator(mode="before")
def validate_data(cls, values):
if not values.get("data"):
values["data"] = {}
# Any other keyword should be added to the data dictionary
for key in values:
if key not in values["data"] and key not in {"text_key", "data", "default_value"}:
values["data"][key] = values[key]
return values
def get_text(self):
"""
Retrieves the text value from the data dictionary.
If the text key is present in the data dictionary, the corresponding value is returned.
Otherwise, the default value is returned.
Returns:
The text value from the data dictionary or the default value.
"""
return self.data.get(self.text_key, self.default_value)
@classmethod
def from_document(cls, document: Document) -> "Record":
"""
Converts a Document to a Record.
Args:
document (Document): The Document to convert.
Returns:
Record: The converted Record.
"""
data = document.metadata
data["text"] = document.page_content
return cls(data=data, text_key="text")
def __add__(self, other: "Record") -> "Record":
"""
Combines the data of two records by attempting to add values for overlapping keys
for all types that support the addition operation. Falls back to the value from 'other'
record when addition is not supported.
"""
combined_data = self.data.copy()
for key, value in other.data.items():
# If the key exists in both records and both values support the addition operation
if key in combined_data:
try:
combined_data[key] += value
except TypeError:
# Fallback: Use the value from 'other' record if addition is not supported
combined_data[key] = value
else:
# If the key is not in the first record, simply add it
combined_data[key] = value
return Record(data=combined_data)
def to_lc_document(self) -> Document:
"""
Converts the Record to a Document.
Returns:
Document: The converted Document.
"""
text = self.data.pop(self.text_key, self.default_value)
return Document(page_content=text, metadata=self.data)
def __getattr__(self, key):
"""
Allows attribute-like access to the data dictionary.
"""
try:
if key.startswith("__"):
return self.__getattribute__(key)
if key in {"data", "text_key"} or key.startswith("_"):
return super().__getattr__(key)
return self.data.get(key, self.default_value)
except KeyError:
# Fallback to default behavior to raise AttributeError for undefined attributes
raise AttributeError(f"'{type(self).__name__}' object has no attribute '{key}'")
def __setattr__(self, key, value):
"""
Allows attribute-like setting of values in the data dictionary,
while still allowing direct assignment to class attributes.
"""
if key in {"data", "text_key"} or key.startswith("_"):
super().__setattr__(key, value)
else:
self.data[key] = value
def __delattr__(self, key):
"""
Allows attribute-like deletion from the data dictionary.
"""
if key in {"data", "text_key"} or key.startswith("_"):
super().__delattr__(key)
else:
del self.data[key]
def __deepcopy__(self, memo):
"""
Custom deepcopy implementation to handle copying of the Record object.
"""
# Create a new Record object with a deep copy of the data dictionary
return Record(data=copy.deepcopy(self.data, memo), text_key=self.text_key, default_value=self.default_value)
def __str__(self) -> str:
"""
Returns a string representation of the Record, including text and data.
"""
# Assuming a method to dump model data as JSON string exists.
# If it doesn't, you might need to implement it or use json.dumps() directly.
# build the string considering all keys in the data dictionary
prefix = "Record("
suffix = ")"
text = f"text_key={self.text_key}, "
text += ", ".join([f"{k}={v}" for k, v in self.data.items()])
return prefix + text + suffix
# check which attributes the Record has by checking the keys in the data dictionary
def __dir__(self):
return super().__dir__() + list(self.data.keys())
INPUT_FIELD_NAME = "input_value"
InputType = Literal["chat", "text", "any"]
OutputType = Literal["chat", "text", "any", "debug"]