Knowledge Node

KnowledgeNode ¶

Bases: BaseModel

Source code in src/fed_rag/data_structures/knowledge_node.py

class KnowledgeNode(BaseModel):
    model_config = ConfigDict(
        # ensures that validation is performed for defaulted None values
        validate_default=True
    )
    node_id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    embedding: list[float] | None = Field(
        description="Encoded representation of node. If multimodal type, then this is shared embedding between image and text.",
        default=None,
    )
    node_type: NodeType = Field(description="Type of node.")
    text_content: str | None = Field(
        description="Text content. Used for TEXT and potentially MULTIMODAL node types.",
        default=None,
    )
    image_content: bytes | None = Field(
        description="Image content as binary data (decoded from base64)",
        default=None,
    )
    metadata: dict = Field(
        description="Metadata for node.", default_factory=dict
    )

    # validators
    @field_validator("text_content", mode="before")
    @classmethod
    def validate_text_content(
        cls, value: str | None, info: ValidationInfo
    ) -> str | None:
        node_type = info.data.get("node_type")
        node_type = cast(NodeType, node_type)
        if node_type == NodeType.TEXT and value is None:
            raise ValueError("NodeType == 'text', but text_content is None.")

        if node_type == NodeType.MULTIMODAL and value is None:
            raise ValueError(
                "NodeType == 'multimodal', but text_content is None."
            )

        return value

    @field_validator("image_content", mode="after")
    @classmethod
    def validate_image_content(
        cls, value: str | None, info: ValidationInfo
    ) -> str | None:
        node_type = info.data.get("node_type")
        node_type = cast(NodeType, node_type)
        if node_type == NodeType.IMAGE:
            if value is None:
                raise ValueError(
                    "NodeType == 'image', but image_content is None."
                )

        if node_type == NodeType.MULTIMODAL:
            if value is None:
                raise ValueError(
                    "NodeType == 'multimodal', but image_content is None."
                )

        return value

    def get_content(self) -> NodeContent:
        """Return dict of node content."""
        content: NodeContent = {
            "image_content": self.image_content,
            "text_content": self.text_content,
        }
        return content

    @field_serializer("metadata")
    def serialize_metadata(
        self, metadata: dict[Any, Any] | None
    ) -> str | None:
        """
        Custom serializer for the metadata field.

        Will serialize the metadata field into a json string.

        Args:
            metadata: Metadata dictionary to serialize.

        Returns:
            Serialized metadata as a json string.
        """
        if metadata:
            return json.dumps(metadata)
        return None

    @field_validator("metadata", mode="before")
    @classmethod
    def deserialize_metadata(
        cls, metadata: dict[Any, Any] | str | None
    ) -> dict[Any, Any] | None:
        """
        Custom validator for the metadata field.

        Will deserialize the metadata from a json string if it's a string.

        Args:
            metadata: Metadata to validate. If it is a json string, it will be deserialized into a dictionary.

        Returns:
            Validated metadata.
        """
        if isinstance(metadata, str):
            deserialized_metadata = json.loads(metadata)
            return cast(dict[Any, Any], deserialized_metadata)
        if metadata is None:
            return {}
        return metadata

    def model_dump_without_embeddings(self) -> dict[str, Any]:
        """Seriliaze the node without the embedding."""
        return self.model_dump(exclude={"embedding"})

get_content ¶

get_content()

Return dict of node content.

Source code in src/fed_rag/data_structures/knowledge_node.py

def get_content(self) -> NodeContent:
    """Return dict of node content."""
    content: NodeContent = {
        "image_content": self.image_content,
        "text_content": self.text_content,
    }
    return content

serialize_metadata ¶

serialize_metadata(metadata)

Custom serializer for the metadata field.

Will serialize the metadata field into a json string.

Parameters:

Name	Type	Description	Default
`metadata`	`dict[Any, Any] \| None`	Metadata dictionary to serialize.	required

Returns:

Type	Description
`str \| None`	Serialized metadata as a json string.

Source code in src/fed_rag/data_structures/knowledge_node.py

@field_serializer("metadata")
def serialize_metadata(
    self, metadata: dict[Any, Any] | None
) -> str | None:
    """
    Custom serializer for the metadata field.

    Will serialize the metadata field into a json string.

    Args:
        metadata: Metadata dictionary to serialize.

    Returns:
        Serialized metadata as a json string.
    """
    if metadata:
        return json.dumps(metadata)
    return None

deserialize_metadata `classmethod` ¶

deserialize_metadata(metadata)

Custom validator for the metadata field.

Will deserialize the metadata from a json string if it's a string.

Parameters:

Name	Type	Description	Default
`metadata`	`dict[Any, Any] \| str \| None`	Metadata to validate. If it is a json string, it will be deserialized into a dictionary.	required

Returns:

Type	Description
`dict[Any, Any] \| None`	Validated metadata.

Source code in src/fed_rag/data_structures/knowledge_node.py

@field_validator("metadata", mode="before")
@classmethod
def deserialize_metadata(
    cls, metadata: dict[Any, Any] | str | None
) -> dict[Any, Any] | None:
    """
    Custom validator for the metadata field.

    Will deserialize the metadata from a json string if it's a string.

    Args:
        metadata: Metadata to validate. If it is a json string, it will be deserialized into a dictionary.

    Returns:
        Validated metadata.
    """
    if isinstance(metadata, str):
        deserialized_metadata = json.loads(metadata)
        return cast(dict[Any, Any], deserialized_metadata)
    if metadata is None:
        return {}
    return metadata

model_dump_without_embeddings ¶

model_dump_without_embeddings()

Seriliaze the node without the embedding.

Source code in src/fed_rag/data_structures/knowledge_node.py

def model_dump_without_embeddings(self) -> dict[str, Any]:
    """Seriliaze the node without the embedding."""
    return self.model_dump(exclude={"embedding"})

Knowledge Node

KnowledgeNode ¶

get_content ¶

serialize_metadata ¶

deserialize_metadata classmethod ¶

model_dump_without_embeddings ¶

deserialize_metadata `classmethod` ¶