# Source code for julee.domain.models.assembly_specification.knowledge_service_query

"""
KnowledgeServiceQuery domain models for the Capture, Extract, Assemble,
Publish workflow.

This module contains the KnowledgeServiceQuery domain object that represents
specific queries to knowledge services for data extraction in the CEAP
workflow system.

A KnowledgeServiceQuery defines a specific extraction operation that can be
performed against a knowledge service to extract data for a particular part
of an AssemblySpecification's JSON schema.

All domain models use Pydantic BaseModel for validation, serialization,
and type safety, following the patterns established in the sample project.
"""

from datetime import datetime, timezone
from typing import Any

from pydantic import BaseModel, Field, field_validator



# NOTE: a Sphinx "[docs]" link marker (HTML extraction artifact) stood here.
class KnowledgeServiceQuery(BaseModel):
    """Knowledge service query configuration for extracting specific data.

    A KnowledgeServiceQuery represents a specific extraction operation that
    can be performed against a knowledge service. It defines which knowledge
    service to use and what prompt to send for data extraction.

    When executed, the relevant section of the AssemblySpecification's JSON
    schema will be passed along with the prompt to ensure the knowledge
    service response conforms to the expected structure and validation
    requirements.

    The mapping between queries and schema sections is handled by the
    AssemblySpecification's knowledge_service_queries field.

    Validation:
        ``query_id``, ``name``, ``knowledge_service_id`` and ``prompt`` must
        contain at least one non-whitespace character; surrounding whitespace
        is stripped from the stored value. A blank value raises
        ``ValueError`` from the corresponding validator.

    Defaults:
        ``query_metadata`` defaults to a fresh empty dict, ``assistant_prompt``
        to ``None``, and ``created_at`` / ``updated_at`` to the current
        timezone-aware UTC time (each evaluated independently).

    Examples of query_metadata usage:

    For Anthropic services::

        query_metadata = {
            "model": "claude-sonnet-4-5",
            "max_tokens": 4000,
            "temperature": 0.1
        }

    For OpenAI services::

        query_metadata = {
            "model": "gpt-4",
            "temperature": 0.2,
            "top_p": 0.9
        }

    For custom services::

        query_metadata = {
            "endpoint": "custom-model-v2",
            "timeout": 30,
            "retries": 3
        }

    """

    # Core query identification
    query_id: str = Field(description="Unique identifier for this query")
    name: str = Field(description="Human-readable name describing the query purpose")

    # Knowledge service configuration
    knowledge_service_id: str = Field(
        description="Identifier of the knowledge service to query"
    )
    prompt: str = Field(
        description="The specific prompt to send to the knowledge service "
        "for this extraction"
    )

    # Service-specific configuration
    # default_factory gives every instance its own dict (no shared mutable default).
    query_metadata: dict[str, Any] | None = Field(
        default_factory=dict,
        description="Service-specific metadata and configuration options "
        "such as model selection, temperature, max_tokens, etc. "
        "The structure depends on the specific knowledge service being used.",
    )
    assistant_prompt: str | None = Field(
        default=None,
        description="Optional assistant message content to constrain "
        "or prime the model's response. This is added as the final "
        "assistant message before the model generates its response, "
        "allowing control over response format and structure.",
    )

    # Timestamps: timezone-aware UTC, computed when the instance is created.
    created_at: datetime | None = Field(
        default_factory=lambda: datetime.now(timezone.utc)
    )
    updated_at: datetime | None = Field(
        default_factory=lambda: datetime.now(timezone.utc)
    )

    @field_validator("query_id")
    @classmethod
    def query_id_must_not_be_empty(cls, v: str) -> str:
        """Return ``v`` stripped of surrounding whitespace.

        Raises:
            ValueError: If ``v`` is empty or contains only whitespace.
        """
        stripped = v.strip() if v else ""
        if not stripped:
            raise ValueError("Query ID cannot be empty")
        return stripped

    @field_validator("name")
    @classmethod
    def name_must_not_be_empty(cls, v: str) -> str:
        """Return ``v`` stripped of surrounding whitespace.

        Raises:
            ValueError: If ``v`` is empty or contains only whitespace.
        """
        stripped = v.strip() if v else ""
        if not stripped:
            raise ValueError("Query name cannot be empty")
        return stripped

    @field_validator("knowledge_service_id")
    @classmethod
    def knowledge_service_id_must_not_be_empty(cls, v: str) -> str:
        """Return ``v`` stripped of surrounding whitespace.

        Raises:
            ValueError: If ``v`` is empty or contains only whitespace.
        """
        stripped = v.strip() if v else ""
        if not stripped:
            raise ValueError("Knowledge service ID cannot be empty")
        return stripped

    @field_validator("prompt")
    @classmethod
    def prompt_must_not_be_empty(cls, v: str) -> str:
        """Return ``v`` stripped of surrounding whitespace.

        Raises:
            ValueError: If ``v`` is empty or contains only whitespace.
        """
        stripped = v.strip() if v else ""
        if not stripped:
            raise ValueError("Query prompt cannot be empty")
        return stripped