Python SDK Reference
This is the complete API reference for the waxell-observe package. All public symbols are exported from the top-level waxell_observe module.
from waxell_observe import (
# Top-level functions
init,
shutdown,
generate_session_id,
# Decorators
observe, # Agent run decorator (alias for waxell_agent)
waxell_agent, # Original agent decorator (identical to observe)
tool, # @tool decorator
decision, # @decision decorator
retrieval, # @retrieval decorator
reasoning_dec, # @reasoning decorator
retry_dec, # @retry decorator
step_dec, # @step decorator
# Convenience functions (work within active context)
tag,
metadata,
score,
decide,
step,
reason,
retrieve,
retry,
get_context,
# Human-in-the-loop
input, # Drop-in replacement for input()
human_turn, # Context manager for non-terminal channels
human_interaction, # One-shot recording
# Approval handlers
prompt_approval, # Terminal Y/N prompt
auto_approve, # Always approve (testing)
auto_deny, # Always deny (testing)
# Core classes
WaxellObserveClient,
ObserveConfig,
WaxellContext,
HumanTurn,
# Types
ApprovalDecision,
LlmCallInfo,
PolicyCheckResult,
PromptGuardResult,
RunCompleteResult,
RunInfo,
# Errors
ConfigurationError,
ObserveError,
PolicyViolationError,
PromptGuardError,
)
init
import waxell_observe
waxell_observe.init(
api_key: str = "",
api_url: str = "",
capture_content: bool = False,
instrument: list[str] | None = None,
instrument_infra: bool = True,
infra_libraries: list[str] | None = None,
infra_exclude: list[str] | None = None,
resource_attributes: dict | None = None,
debug: bool = False,
prompt_guard: bool = False,
prompt_guard_server: bool = False,
prompt_guard_action: str = "block",
) -> None
One-line initialization for waxell-observe. This single call configures the HTTP client, initializes OTel tracing (if installed), and auto-instruments installed LLM libraries.
| Parameter | Type | Default | Description |
|---|---|---|---|
api_key | str | "" | Waxell API key (wax_sk_...). Falls back to WAXELL_API_KEY env var |
api_url | str | "" | Waxell API URL. Falls back to WAXELL_API_URL env var |
capture_content | bool | False | Include prompt/response content in OTel traces |
instrument | list[str] | None | None | Libraries to auto-instrument (e.g. ["openai", "anthropic"]). None means auto-detect all installed libraries |
instrument_infra | bool | True | Enable auto-instrumentation of infrastructure libraries (HTTP clients, databases, caches, queues). Falls back to WAXELL_INSTRUMENT_INFRA env var |
infra_libraries | list[str] | None | None | Only instrument these specific infra libraries (e.g. ["redis", "httpx"]). None means auto-detect all |
infra_exclude | list[str] | None | None | Instrument all infra libraries except these (e.g. ["celery", "grpc"]). Falls back to WAXELL_INFRA_EXCLUDE env var (comma-delimited) |
resource_attributes | dict | None | None | Custom OTel resource attributes applied to all spans (e.g. {"deployment.environment": "production"}) |
debug | bool | False | Enable debug logging and console span export |
prompt_guard | bool | False | Enable client-side prompt guard (PII, credential, injection detection). Falls back to WAXELL_PROMPT_GUARD env var |
prompt_guard_server | bool | False | Also check server-side guard service (ML-powered via Presidio + HuggingFace). Falls back to WAXELL_PROMPT_GUARD_SERVER env var |
prompt_guard_action | str | "block" | Action on violations: "block" (raise error), "warn" (log and continue), "redact" (replace with ##TYPE##). Falls back to WAXELL_PROMPT_GUARD_ACTION env var |
Behavior:
- Checks the WAXELL_OBSERVE environment variable kill switch first. If set to "false", "0", or "no", initialization is skipped entirely.
- Idempotent: calling init() multiple times is safe. Only the first call takes effect.
- OTel tracing failure does not block the HTTP path. If tracing initialization fails, a warning is logged and the HTTP-based telemetry continues to work.
- Auto-instrumentation failure does not block manual tracing.
Example:
import waxell_observe
# Minimal setup -- auto-detects URL from env, instruments all installed libraries
waxell_observe.init(api_key="wax_sk_abc123")
# Full control
waxell_observe.init(
api_key="wax_sk_abc123",
api_url="https://acme.waxell.dev",
capture_content=True,
instrument=["openai", "anthropic"],
debug=True,
)
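The "redact" action replaces detected spans with ##TYPE## placeholders. A minimal sketch of that behavior, using illustrative patterns (the SDK's real detectors cover PII, credentials, and injection and are not shown here):

```python
import re

# Illustrative patterns only -- NOT the SDK's actual detectors.
PATTERNS = {
    "EMAIL": re.compile(r"[\w.+-]+@[\w-]+\.[\w.]+"),
    "API_KEY": re.compile(r"wax_sk_[A-Za-z0-9]+"),
}

def redact(text: str) -> str:
    # Replace each detected span with a ##TYPE## placeholder,
    # mirroring prompt_guard_action="redact".
    for type_name, pattern in PATTERNS.items():
        text = pattern.sub(f"##{type_name}##", text)
    return text

assert redact("key wax_sk_abc123 sent to a@b.co") == "key ##API_KEY## sent to ##EMAIL##"
```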
shutdown
import waxell_observe
waxell_observe.shutdown() -> None
Shut down waxell-observe: flush pending traces and remove auto-instrumentation.
Behavior:
- Calls shutdown_tracing() to flush the OTel span processor and shut down the TracerProvider.
- Calls uninstrument_all() to remove monkey-patches from instrumented libraries.
- Resets the internal _initialized flag so init() can be called again.
- Safe to call even if init() was never called.
Example:
import waxell_observe
import atexit
waxell_observe.init(api_key="wax_sk_abc123")
atexit.register(waxell_observe.shutdown)
generate_session_id
from waxell_observe import generate_session_id
generate_session_id() -> str
Generate a random session ID for grouping related runs.
Returns: A string in the format sess_ followed by 16 hex characters (e.g. sess_a1b2c3d4e5f60789).
Example:
from waxell_observe import generate_session_id, WaxellContext
session = generate_session_id()
async with WaxellContext(agent_name="agent-1", session_id=session) as ctx:
...
async with WaxellContext(agent_name="agent-2", session_id=session) as ctx:
...
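For illustration, the documented format (sess_ plus 16 hex characters) corresponds to 8 random bytes. A hypothetical local equivalent -- not the SDK's implementation -- could look like:

```python
import re
import secrets

def make_session_id() -> str:
    # "sess_" followed by 16 hex characters (8 random bytes).
    return "sess_" + secrets.token_hex(8)

sid = make_session_id()
assert re.fullmatch(r"sess_[0-9a-f]{16}", sid)
```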
Top-Level Convenience Functions
These functions operate on the current WaxellContext in scope. They are no-ops when called outside of an active context, making them safe to use in code that may or may not be wrapped by @observe or WaxellContext.
tag
import waxell_observe
waxell_observe.tag(key: str, value: str) -> None
Set a searchable tag on the current context. No-op if no context is active.
Example:
from waxell_observe import observe
import waxell_observe
@observe(agent_name="my-agent")
async def run_agent(query: str) -> str:
waxell_observe.tag("environment", "production")
waxell_observe.tag("pipeline", "rag-v2")
return await process(query)
metadata
import waxell_observe
waxell_observe.metadata(key: str, value: Any) -> None
Set metadata on the current context. Values can be any JSON-serializable type. No-op if no context is active.
Example:
waxell_observe.metadata("model_version", "gpt-4-turbo")
waxell_observe.metadata("config", {"temperature": 0.7})
score
import waxell_observe
waxell_observe.score(
name: str,
value: float | str | bool,
data_type: str = "numeric",
comment: str = "",
) -> None
Record a score on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Score name |
value | float | str | bool | (required) | Score value |
data_type | str | "numeric" | "numeric", "categorical", or "boolean" |
comment | str | "" | Optional comment |
Example:
waxell_observe.score("relevance", 0.95)
waxell_observe.score("helpful", True, data_type="boolean")
waxell_observe.score("category", "informational", data_type="categorical")
decide
import waxell_observe
waxell_observe.decide(
name: str,
chosen: str,
options: list[str] | None = None,
reasoning: str = "",
confidence: float | None = None,
) -> None
Record a decision on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Decision name |
chosen | str | (required) | The selected option |
options | list[str] | None | None | Available choices |
reasoning | str | "" | Why this option was chosen |
confidence | float | None | None | Confidence score (0.0-1.0) |
Example:
waxell_observe.decide(
"route_query",
chosen="semantic_search",
options=["semantic", "keyword", "hybrid"],
reasoning="Query contains natural language phrasing",
confidence=0.9,
)
step
waxell_observe.step(name: str, output: dict | None = None) -> None
Record an execution step on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Step name |
output | dict | None | None | Step output data |
Example:
waxell_observe.step("preprocessing", output={"tokens": 150, "language": "en"})
waxell_observe.step("validation") # output is optional
reason
waxell_observe.reason(
step: str,
thought: str,
evidence: list[str] | None = None,
conclusion: str = "",
) -> None
Record a reasoning step on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
step | str | (required) | Reasoning step name |
thought | str | (required) | The reasoning thought process |
evidence | list[str] | None | None | Supporting evidence |
conclusion | str | "" | Final conclusion |
Example:
waxell_observe.reason(
"source_evaluation",
thought="Document A is from a peer-reviewed journal",
evidence=["Published 2024", "Cited 45 times"],
conclusion="High reliability source",
)
retrieve
waxell_observe.retrieve(
query: str,
documents: list[dict],
source: str = "",
scores: list[float] | None = None,
) -> None
Record a retrieval operation on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
query | str | (required) | The search query |
documents | list[dict] | (required) | Retrieved documents |
source | str | "" | Data source name |
scores | list[float] | None | None | Relevance scores |
Example:
waxell_observe.retrieve(
query="AI safety best practices",
documents=[{"id": "doc1", "title": "Safety Guide"}],
source="pinecone",
scores=[0.95],
)
retry
waxell_observe.retry(
attempt: int,
reason: str,
strategy: str = "retry",
original_error: str = "",
fallback_to: str = "",
) -> None
Record a retry/fallback event on the current context. No-op if no context is active.
| Parameter | Type | Default | Description |
|---|---|---|---|
attempt | int | (required) | Attempt number (1-indexed) |
reason | str | (required) | Why the retry occurred |
strategy | str | "retry" | Strategy: "retry", "fallback", "circuit_break" |
original_error | str | "" | Error that triggered the retry |
fallback_to | str | "" | Fallback target name |
Example:
waxell_observe.retry(
attempt=2,
reason="Rate limit exceeded",
strategy="fallback",
original_error="429 Too Many Requests",
fallback_to="gpt-4o-mini",
)
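A typical pattern is to call this from inside your own retry loop, once per failed attempt. A self-contained sketch with a pluggable recorder (the record callback is a stand-in for waxell_observe.retry; the loop itself is hypothetical, not part of the SDK):

```python
def call_with_retries(fn, max_attempts=3, record=lambda **kw: None):
    # Run fn(), recording each failed attempt through `record`
    # with the same keyword names waxell_observe.retry accepts.
    last_error = None
    for attempt in range(1, max_attempts + 1):
        try:
            return fn()
        except Exception as exc:
            last_error = exc
            record(attempt=attempt, reason=str(exc), strategy="retry",
                   original_error=type(exc).__name__)
    raise last_error

# Demo with a stub recorder: fails twice, then succeeds.
events = []
attempts = {"n": 0}
def flaky():
    attempts["n"] += 1
    if attempts["n"] < 3:
        raise TimeoutError("upstream timeout")
    return "ok"

assert call_with_retries(flaky, record=lambda **kw: events.append(kw)) == "ok"
assert [e["attempt"] for e in events] == [1, 2]
```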
get_context
import waxell_observe
waxell_observe.get_context() -> WaxellContext | None
Get the current WaxellContext if one is active, otherwise None.
Example:
ctx = waxell_observe.get_context()
if ctx:
ctx.record_llm_call(model="gpt-4o", tokens_in=100, tokens_out=50)
input
import waxell_observe
waxell_observe.input(prompt: str = "", *, action: str = "input") -> str
Drop-in replacement for Python's built-in input(). Calls input(prompt) and records the prompt, response, and elapsed time as a human_turn IO span.
Falls back to plain input() if called outside a WaxellContext.
Example:
answer = waxell_observe.input("Approve? (y/n): ")
human_turn
import waxell_observe
waxell_observe.human_turn(
prompt: str = "",
channel: str = "terminal",
action: str = "",
metadata: dict | None = None,
) -> HumanTurn | _NoOpHumanTurn
Returns a context manager that captures a human interaction as a timed IO span. Use for non-terminal channels (Slack, webhooks, UI).
Returns a no-op if called outside a WaxellContext.
Example:
with waxell_observe.human_turn(prompt="Deploy?", channel="slack", action="approval") as turn:
response = await wait_for_reaction()
turn.set_response(response)
human_interaction
import waxell_observe
waxell_observe.human_interaction(
prompt: str = "",
response: str = "",
channel: str = "terminal",
action: str = "",
elapsed_seconds: float | None = None,
metadata: dict | None = None,
) -> None
Record a completed human interaction. One-shot alternative to human_turn() when you already have all the data.
No-op if called outside a WaxellContext.
Example:
waxell_observe.human_interaction(
prompt="Pick target",
response="staging",
channel="slack",
elapsed_seconds=12.5,
)
prompt_approval
import waxell_observe
waxell_observe.prompt_approval(error: PolicyViolationError) -> ApprovalDecision
Built-in on_policy_block handler. Prints a terminal banner with the block reason, approvers, and timeout, then prompts y/n.
Example:
@waxell_observe.observe(
agent_name="my-agent",
enforce_policy=True,
on_policy_block=waxell_observe.prompt_approval,
)
async def my_function():
...
auto_approve / auto_deny
import waxell_observe
waxell_observe.auto_approve(error: PolicyViolationError) -> ApprovalDecision
waxell_observe.auto_deny(error: PolicyViolationError) -> ApprovalDecision
Test helpers. auto_approve always returns ApprovalDecision(approved=True). auto_deny always returns ApprovalDecision(approved=False).
Drop-in Imports
Pre-instrumented modules that you can import directly, no init() required:
from waxell_observe.openai import openai
from waxell_observe.anthropic import anthropic
These modules are thin wrappers around the real SDKs with auto-instrumentation already applied. All OpenAI/Anthropic calls made through these imports are automatically traced.
Example:
from waxell_observe.openai import openai
client = openai.OpenAI()
response = client.chat.completions.create(
model="gpt-4o",
messages=[{"role": "user", "content": "Hello!"}]
)
# Automatically traced with model, tokens, cost, latency
Instrumentation Functions
instrument_all
from waxell_observe.instrumentors import instrument_all
instrument_all(libraries: list[str] | None = None) -> dict[str, bool]
Manually instrument LLM libraries. Called automatically by init(), but can be called directly if needed.
| Parameter | Type | Default | Description |
|---|---|---|---|
libraries | list[str] | None | None | Libraries to instrument. None means auto-detect all installed |
Returns: A dict mapping library name to whether instrumentation succeeded (e.g. {"openai": True, "anthropic": True}).
Supported libraries: 157+ LLM providers, vector databases, embedding models, frameworks, and more. Core providers include openai, anthropic, litellm, groq, huggingface, gemini, cohere, mistral, together, ai21, bedrock, vertex_ai. See Auto-Instrumentation for the full list.
uninstrument_all
from waxell_observe.instrumentors import uninstrument_all
uninstrument_all() -> None
Remove all instrumentation patches. Called automatically by shutdown().
OpenTelemetry Functions
These functions manage the OTel tracing layer. They are called automatically by init() and shutdown(), but can be used directly for advanced control.
init_tracing
from waxell_observe.tracing import init_tracing
init_tracing(
api_url: str | None = None,
api_key: str | None = None,
otel_endpoint: str | None = None,
tenant_id: str | None = None,
debug: bool | None = None,
capture_content: bool = False,
shutdown_on_exit: bool = True,
resource_attributes: dict | None = None,
) -> None
Initialize OpenTelemetry tracing with OTLP HTTP export to the Waxell backend.
| Parameter | Type | Default | Description |
|---|---|---|---|
api_url | str | None | None | Waxell API URL. Resolved from config if not provided |
api_key | str | None | None | Waxell API key. Resolved from config if not provided |
otel_endpoint | str | None | None | Explicit OTel collector endpoint. Auto-discovered if not provided |
tenant_id | str | None | None | Explicit tenant ID for trace routing. Auto-discovered from API key if not provided |
debug | bool | None | None | Enable debug logging and console span export. Defaults to WAXELL_DEBUG env var |
capture_content | bool | False | Include prompt/response content in spans |
shutdown_on_exit | bool | True | Register atexit handler for clean shutdown |
resource_attributes | dict | None | None | Extra OTel resource attributes |
flush_tracing
from waxell_observe.tracing import flush_tracing
flush_tracing(timeout_millis: int = 30000) -> None
Force flush pending spans to the backend.
shutdown_tracing
from waxell_observe.tracing import shutdown_tracing
shutdown_tracing() -> None
Shut down the TracerProvider and flush remaining spans.
WaxellObserveClient
from waxell_observe import WaxellObserveClient
HTTP client for the Waxell Observe API. Handles configuration resolution, authentication, and all API interactions.
Constructor
WaxellObserveClient(
api_url: str | None = None,
api_key: str | None = None,
)
| Parameter | Type | Default | Description |
|---|---|---|---|
api_url | str | None | None | Control plane URL. Overrides all other config sources |
api_key | str | None | None | API key. Overrides all other config sources |
Class Methods
configure
@classmethod
WaxellObserveClient.configure(api_url: str, api_key: str) -> None
Set global configuration for all instances. Call once at application startup. All subsequent WaxellObserveClient() instances will use these values (unless overridden by constructor arguments).
get_config
@classmethod
WaxellObserveClient.get_config() -> ObserveConfig | None
Returns the current global configuration, or None if configure() has not been called.
is_configured
@classmethod
WaxellObserveClient.is_configured() -> bool
Returns True if global configuration is set and both api_url and api_key are non-empty.
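A sketch of the resulting precedence -- constructor arguments over configure() values over environment variables (the env-var fallback here is an assumption carried over from init(); plain dicts, not the SDK's internals):

```python
import os

GLOBAL_CONFIG = {}  # stand-in for the class-level config set by configure()

def configure(api_url, api_key):
    GLOBAL_CONFIG.update(api_url=api_url, api_key=api_key)

def resolve(api_url=None, api_key=None):
    # Constructor args win, then configure() values, then env vars.
    return {
        "api_url": api_url or GLOBAL_CONFIG.get("api_url") or os.environ.get("WAXELL_API_URL", ""),
        "api_key": api_key or GLOBAL_CONFIG.get("api_key") or os.environ.get("WAXELL_API_KEY", ""),
    }

configure("https://acme.waxell.dev", "wax_sk_global")
assert resolve()["api_key"] == "wax_sk_global"
assert resolve(api_key="wax_sk_local")["api_key"] == "wax_sk_local"
```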
Async Methods
start_run
async start_run(
agent_name: str,
workflow_name: str = "default",
inputs: dict | None = None,
metadata: dict | None = None,
trace_id: str = "",
user_id: str = "",
user_group: str = "",
session_id: str = "",
parent_workflow_id: str = "",
root_workflow_id: str = "",
) -> RunInfo
Start an execution run on the control plane.
| Parameter | Type | Default | Description |
|---|---|---|---|
agent_name | str | (required) | Agent name |
workflow_name | str | "default" | Workflow name |
inputs | dict | None | None | Input data for the run |
metadata | dict | None | None | Arbitrary metadata |
trace_id | str | "" | External trace ID for correlation |
user_id | str | "" | User identifier for per-user analytics |
user_group | str | "" | User group for authorization policies |
session_id | str | "" | Session ID for grouping related runs |
parent_workflow_id | str | "" | Parent workflow ID for nested agent lineage |
root_workflow_id | str | "" | Root workflow ID for top-level lineage tracking |
Returns: RunInfo with run_id, workflow_id, and started_at.
complete_run
async complete_run(
run_id: str,
result: dict | None = None,
status: str = "success",
error: str = "",
error_type: str = "",
traceback: str = "",
steps: list | None = None,
trace_id: str = "",
root_span_id: str = "",
) -> RunCompleteResult
Complete an execution run. Returns governance info including retry feedback.
| Parameter | Type | Default | Description |
|---|---|---|---|
run_id | str | (required) | Run ID from start_run |
result | dict | None | None | Result data |
status | str | "success" | "success" or "error" |
error | str | "" | Error message |
error_type | str | "" | Exception class name (e.g. "ValueError") |
traceback | str | "" | Full traceback string |
steps | list | None | None | Additional steps |
trace_id | str | "" | OTel trace ID for correlation |
root_span_id | str | "" | OTel root span ID for correlation |
Returns: RunCompleteResult with run_id, duration, governance_action, governance_reason, retry_feedback, and max_retries.
record_llm_calls
async record_llm_calls(
run_id: str,
calls: list[dict],
) -> dict
Record one or more LLM calls for a run. No-op if calls is empty.
| Parameter | Type | Description |
|---|---|---|
run_id | str | Run ID |
calls | list[dict] | List of LLM call dicts with keys: model, tokens_in, tokens_out, and optionally cost, task, prompt_preview, response_preview |
Returns: Server response dict (includes governance field for mid-execution governance).
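A calls payload matching the documented key set can be assembled as plain dicts (field values here are invented for illustration):

```python
calls = [
    {
        # Required keys per the documented schema:
        "model": "gpt-4o",
        "tokens_in": 1200,
        "tokens_out": 340,
        # Optional keys:
        "cost": 0.0123,
        "task": "summarize",
        "prompt_preview": "Summarize the following...",
        "response_preview": "The document describes...",
    },
]
required = {"model", "tokens_in", "tokens_out"}
assert all(required <= set(call) for call in calls)
```

The list would then be sent with await client.record_llm_calls(run_id, calls=calls).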
record_steps
async record_steps(
run_id: str,
steps: list[dict],
) -> dict
Record execution steps for a run. No-op if steps is empty.
| Parameter | Type | Description |
|---|---|---|
run_id | str | Run ID |
steps | list[dict] | List of step dicts with keys: step_name and optionally output, position |
Returns: Server response dict (includes governance field for mid-execution governance).
record_scores
async record_scores(
run_id: str,
scores: list[dict],
) -> dict
Record scores (user feedback, evaluation results) for a run.
| Parameter | Type | Description |
|---|---|---|
run_id | str | Run ID |
scores | list[dict] | List of score dicts. Each dict should contain: name, data_type ("numeric", "categorical", or "boolean"), and either numeric_value or string_value depending on data type. Optional: comment |
No-op if scores is empty. Returns: Server response dict.
Example:
await client.record_scores(run_id, scores=[
{"name": "accuracy", "data_type": "numeric", "numeric_value": 0.95},
{"name": "thumbs_up", "data_type": "boolean", "numeric_value": 1.0, "string_value": "true"},
{"name": "category", "data_type": "categorical", "string_value": "helpful", "comment": "User feedback"},
])
get_prompt
async get_prompt(
name: str,
*,
label: str = "",
version: int = 0,
) -> PromptInfo
Fetch a prompt from the control plane. Returns the prompt content, config, and a compile() helper for template rendering.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Prompt name |
label | str | "" | Label to fetch (e.g. "production"). If empty, fetches latest version |
version | int | 0 | Specific version number. Takes precedence over label if both provided |
Returns: PromptInfo with name, version, prompt_type, content, config, labels, and compile() method.
Example:
# Fetch by label (recommended for production)
prompt = await client.get_prompt("summarizer", label="production")
rendered = prompt.compile(topic="AI safety", length="short")
# Fetch specific version
prompt = await client.get_prompt("summarizer", version=3)
# Fetch latest
prompt = await client.get_prompt("summarizer")
check_policy
async check_policy(
agent_name: str,
workflow_name: str = "",
agent_id: str = "",
) -> PolicyCheckResult
Check if execution is allowed by policies.
| Parameter | Type | Default | Description |
|---|---|---|---|
agent_name | str | (required) | Agent name |
workflow_name | str | "" | Workflow name for scoped policies |
agent_id | str | "" | Specific agent instance ID |
Returns: PolicyCheckResult.
record_events
async record_events(events: list[dict]) -> None
Record governance events. No-op if events is empty.
close
async close() -> None
Close the underlying HTTP client. Call this when you are done using the client.
Sync Methods
Each async method has a synchronous counterpart that uses asyncio.run() internally:
| Async Method | Sync Method |
|---|---|
start_run() | start_run_sync() |
complete_run() | complete_run_sync() |
record_llm_calls() | record_llm_calls_sync() |
record_steps() | record_steps_sync() |
record_scores() | record_scores_sync() |
record_spans() | record_spans_sync() |
check_policy() | check_policy_sync() |
record_events() | record_events_sync() |
get_prompt() | get_prompt_sync() |
Sync methods accept the same keyword arguments as their async counterparts.
Sync methods cannot be used inside an already-running async event loop. If a running event loop is detected, the SDK delegates to a background thread with a 60-second timeout. Use the async versions in async code when possible.
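The delegation behavior described above can be sketched as follows (a simplified illustration, not the SDK's internal code):

```python
import asyncio
import concurrent.futures

def run_sync(coro, timeout=60.0):
    # If an event loop is already running in this thread, asyncio.run()
    # would raise -- so delegate to a background thread with a timeout,
    # mirroring the documented 60-second fallback.
    try:
        asyncio.get_running_loop()
    except RuntimeError:
        return asyncio.run(coro)  # no loop running: run directly
    with concurrent.futures.ThreadPoolExecutor(max_workers=1) as pool:
        return pool.submit(asyncio.run, coro).result(timeout=timeout)

async def answer():
    return 42

assert run_sync(answer()) == 42
```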
WaxellContext
from waxell_observe import WaxellContext
Context manager (sync and async) that wraps agent execution with observability and governance.
Constructor
WaxellContext(
agent_name: str,
workflow_name: str = "default",
inputs: dict | None = None,
metadata: dict | None = None,
client: WaxellObserveClient | None = None,
enforce_policy: bool = True,
session_id: str = "",
user_id: str = "",
user_group: str = "",
mid_execution_governance: bool = False,
)
| Parameter | Type | Default | Description |
|---|---|---|---|
agent_name | str | (required) | Agent name |
workflow_name | str | "default" | Workflow name |
inputs | dict | None | None | Input data for the run |
metadata | dict | None | None | Arbitrary metadata |
client | WaxellObserveClient | None | None | Pre-configured client. If None, creates one using global config |
enforce_policy | bool | True | Check policies on entry |
session_id | str | "" | Session ID for grouping related runs. Use generate_session_id() to create one |
user_id | str | "" | User identifier for per-user analytics and tracking |
user_group | str | "" | User group for authorization policies (e.g., "enterprise", "free") |
mid_execution_governance | bool | False | Enable cooperative mid-execution governance. When True, each record_step() flushes data and checks for policy violations |
Usage
Works as both async with (async code) and plain with (sync code):
# Async
async with WaxellContext(agent_name="my-agent") as ctx:
result = await my_agent.run(query)
ctx.set_result({"output": result})
# Sync
with WaxellContext(agent_name="my-agent") as ctx:
result = my_agent.run(query)
ctx.set_result({"output": result})
With session and user tracking:
from waxell_observe import WaxellContext, generate_session_id
session = generate_session_id()
async with WaxellContext(
agent_name="my-agent",
session_id=session,
user_id="user_456",
) as ctx:
ctx.set_tag("environment", "production")
ctx.set_metadata("request_id", "req_abc123")
result = await my_agent.run(query)
ctx.record_score("relevance", 0.92)
ctx.set_result({"output": result})
Lifecycle
On enter (__aenter__ / __enter__):
- Checks policies (if enforce_policy=True). Raises PolicyViolationError if blocked.
- Starts an execution run on the control plane. session_id and user_id are injected into the run metadata.
- Creates an OTel agent span (if tracing is initialized). Session and user IDs are set as span attributes.
- Sets the ContextVar so auto-instrumented LLM calls are associated with this run.
On exit (__aexit__ / __exit__):
- Flushes buffered LLM calls via record_llm_calls.
- Flushes buffered steps via record_steps.
- Flushes buffered scores via record_scores.
- Flushes buffered behavior spans via record_spans.
- Completes the run with result or error status.
- Ends the OTel agent span and clears the ContextVar.
The sync path (__enter__ / __exit__) uses synchronous HTTP calls and sets the ContextVar in the calling thread, ensuring auto-instrumentation works correctly.
Methods
record_llm_call
record_llm_call(
*,
model: str,
tokens_in: int,
tokens_out: int,
cost: float = 0.0,
task: str = "",
prompt_preview: str = "",
response_preview: str = "",
duration_ms: int | None = None,
provider: str = "",
) -> None
Buffer an LLM call for later flushing. All parameters are keyword-only. If cost is 0.0, it is automatically estimated using built-in model pricing. Also emits an OTel LLM span (if tracing is initialized).
record_step
record_step(step_name: str, output: dict | None = None) -> None
Buffer an execution step. Steps are automatically numbered in the order they are recorded (via an internal position counter). Also emits an OTel step span.
If mid_execution_governance is enabled, this method also flushes buffered data to the server and checks the governance response. Raises PolicyViolationError if the server returns a block action.
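The automatic numbering can be illustrated with a small buffer (a hypothetical stand-in, not the SDK's internal class):

```python
import itertools

class StepBuffer:
    def __init__(self):
        # Internal position counter: steps are numbered in recording order.
        self._position = itertools.count(1)
        self.steps = []

    def record_step(self, step_name, output=None):
        self.steps.append({"step_name": step_name,
                           "output": output,
                           "position": next(self._position)})

buf = StepBuffer()
buf.record_step("preprocessing", {"tokens": 150})
buf.record_step("validation")
assert [s["position"] for s in buf.steps] == [1, 2]
```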
set_result
set_result(result: dict) -> None
Set the result to include when the run is completed.
record_score
record_score(
name: str,
value: float | str | bool,
data_type: str = "numeric",
comment: str = "",
) -> None
Buffer a score (user feedback or evaluation result) for the current run. Scores are flushed to the server when the context exits.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Score name (e.g. "thumbs_up", "accuracy", "relevance") |
value | float | str | bool | (required) | Score value. Type depends on data_type |
data_type | str | "numeric" | One of "numeric", "categorical", or "boolean" |
comment | str | "" | Optional free-text comment |
Value handling by data type:
- "numeric": value is stored as numeric_value (converted to float)
- "boolean": value is stored as both numeric_value (1.0 for truthy, 0.0 for falsy) and string_value ("true" or "false")
- "categorical": value is stored as string_value (converted to string)
Example:
async with WaxellContext(agent_name="my-agent") as ctx:
result = await run_agent(query)
ctx.record_score("accuracy", 0.95)
ctx.record_score("thumbs_up", True, data_type="boolean")
ctx.record_score("category", "helpful", data_type="categorical", comment="User selected")
ctx.set_result({"output": result})
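The value-handling rules for each data type can be sketched as plain payload normalization (a hypothetical helper for illustration, not part of the SDK):

```python
def normalize_score(name, value, data_type="numeric", comment=""):
    # Apply the documented value-handling rules per data type.
    score = {"name": name, "data_type": data_type}
    if comment:
        score["comment"] = comment
    if data_type == "numeric":
        score["numeric_value"] = float(value)
    elif data_type == "boolean":
        score["numeric_value"] = 1.0 if value else 0.0
        score["string_value"] = "true" if value else "false"
    elif data_type == "categorical":
        score["string_value"] = str(value)
    return score

assert normalize_score("accuracy", 0.95) == {
    "name": "accuracy", "data_type": "numeric", "numeric_value": 0.95,
}
```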
set_tag
set_tag(key: str, value: str) -> None
Set a searchable tag on the current agent span. Tags are string key-value pairs that become OTel span attributes with the waxell.tag. prefix.
| Parameter | Type | Description |
|---|---|---|
key | str | Tag name (alphanumeric, underscores, hyphens) |
value | str | Tag value (string) |
Tags are queryable in Grafana TraceQL:
{ span.waxell.tag.environment = "production" }
Example:
async with WaxellContext(agent_name="my-agent") as ctx:
ctx.set_tag("environment", "production")
ctx.set_tag("customer_tier", "enterprise")
ctx.set_tag("region", "us-east-1")
set_metadata
set_metadata(key: str, value: Any) -> None
Set metadata on the current agent span. Unlike tags, metadata values can be any JSON-serializable type. Complex values are automatically JSON-serialized for OTel compatibility.
| Parameter | Type | Description |
|---|---|---|
key | str | Metadata key |
value | Any | Any JSON-serializable value |
Metadata is queryable in Grafana TraceQL:
{ span.waxell.meta.request_id != nil }
Example:
async with WaxellContext(agent_name="my-agent") as ctx:
ctx.set_metadata("request_id", "req_abc123")
ctx.set_metadata("config", {"temperature": 0.7, "max_tokens": 1000})
ctx.set_metadata("retry_count", 2)
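The JSON-serialization step can be sketched as follows (an illustrative helper, not the SDK's internal code): scalar values pass through unchanged, while complex values are serialized so they fit OTel's flat attribute model.

```python
import json

def to_attribute(value):
    # Scalars are valid OTel attribute values as-is;
    # anything else is JSON-serialized.
    if isinstance(value, (str, bool, int, float)):
        return value
    return json.dumps(value)

assert to_attribute("req_abc123") == "req_abc123"
assert to_attribute({"temperature": 0.7}) == '{"temperature": 0.7}'
```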
Behavior Tracking Methods
These methods buffer behavior data as spans, flushed to the server on context exit via the POST /runs/{run_id}/spans/ endpoint.
record_tool_call
record_tool_call(
*,
name: str,
input: dict | str = "",
output: dict | str = "",
duration_ms: int | None = None,
status: str = "ok",
tool_type: str = "function",
error: str = "",
) -> None
Buffer a tool/function call event.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Tool name (e.g. "web_search", "database_query") |
input | dict | str | "" | Tool input parameters |
output | dict | str | "" | Tool output/result |
duration_ms | int | None | None | Execution time in milliseconds |
status | str | "ok" | "ok" or "error" |
tool_type | str | "function" | "function", "api", "database", or "retriever" |
error | str | "" | Error message if status is "error" |
record_retrieval
record_retrieval(
*,
query: str,
documents: list[dict],
source: str = "",
duration_ms: int | None = None,
top_k: int | None = None,
scores: list[float] | None = None,
) -> None
Buffer a RAG retrieval operation.
| Parameter | Type | Default | Description |
|---|---|---|---|
query | str | (required) | The retrieval query string |
documents | list[dict] | (required) | Retrieved docs (e.g. [{id, title, score, snippet}]) |
source | str | "" | Data source name (e.g. "pinecone", "elasticsearch") |
duration_ms | int | None | None | Retrieval time in milliseconds |
top_k | int | None | None | Number of documents requested |
scores | list[float] | None | None | Relevance scores for each retrieved document |
record_decision
record_decision(
*,
name: str,
options: list[str],
chosen: str,
reasoning: str = "",
confidence: float | None = None,
metadata: dict | None = None,
) -> None
Buffer a decision/routing point.
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | (required) | Decision name (e.g. "route_to_agent", "select_model") |
options | list[str] | (required) | Available choices |
chosen | str | (required) | The selected option |
reasoning | str | "" | Why this option was chosen |
confidence | float | None | None | Confidence score (0.0-1.0) |
metadata | dict | None | None | Additional context |
record_reasoning
record_reasoning(
*,
step: str,
thought: str,
evidence: list[str] | None = None,
conclusion: str = "",
) -> None
Buffer a reasoning/chain-of-thought step.
| Parameter | Type | Default | Description |
|---|---|---|---|
step | str | (required) | Reasoning step name |
thought | str | (required) | The reasoning text/thought process |
evidence | list[str] | None | None | Supporting evidence or references |
conclusion | str | "" | Conclusion reached at this step |
record_retry
record_retry(
*,
attempt: int,
reason: str,
strategy: str = "retry",
original_error: str = "",
fallback_to: str = "",
max_attempts: int | None = None,
) -> None
Buffer a retry or fallback event.
| Parameter | Type | Default | Description |
|---|---|---|---|
attempt | int | (required) | Current attempt number (1-based) |
reason | str | (required) | Why a retry/fallback occurred |
strategy | str | "retry" | "retry", "fallback", or "circuit_break" |
original_error | str | "" | The error that triggered the retry |
fallback_to | str | "" | Name of fallback target (model, agent, tool) |
max_attempts | int | None | None | Maximum attempts configured |
check_policy / check_policy_sync
# Async
async check_policy() -> PolicyCheckResult
# Sync
check_policy_sync() -> PolicyCheckResult
Perform a mid-execution policy check. Returns a PolicyCheckResult. Use check_policy_sync() in synchronous code.
Properties
| Property | Type | Description |
|---|---|---|
run_id | str | The run ID from the control plane, or "" if not started |
session_id | str | The session ID passed to the constructor |
user_id | str | The user ID passed to the constructor |
user_group | str | The user group passed to the constructor |
@observe / @waxell_agent
from waxell_observe import observe # Alias for waxell_agent
from waxell_observe import waxell_agent # Original decorator (identical to observe)
Decorator that adds observability and governance to any function. @observe and @waxell_agent are identical -- use whichever reads better in your codebase.
Signature
@observe(
agent_name: str | None = None,
workflow_name: str = "default",
enforce_policy: bool = True,
capture_io: bool = True,
session_id: str = "",
user_id: str = "",
user_group: str = "",
mid_execution_governance: bool = False,
client: WaxellObserveClient | None = None,
)
| Parameter | Type | Default | Description |
|---|---|---|---|
agent_name | str | None | None | Agent name. Defaults to the function name |
workflow_name | str | "default" | Workflow name |
enforce_policy | bool | True | Check policies before execution |
capture_io | bool | True | Capture function inputs and outputs |
session_id | str | "" | Session ID for grouping related runs |
user_id | str | "" | End-user ID for attribution and analytics |
user_group | str | "" | User group for authorization policies |
mid_execution_governance | bool | False | Flush data and check governance on each record_step() call |
client | WaxellObserveClient | None | None | Pre-configured client |
Context Injection
If the decorated function has a waxell_ctx parameter, a WaxellContext instance is injected automatically:
@observe(agent_name="my-agent")
async def my_func(query: str, waxell_ctx=None) -> str:
if waxell_ctx:
waxell_ctx.record_llm_call(model="gpt-4o", tokens_in=100, tokens_out=50)
waxell_ctx.record_score("relevance", 0.9)
waxell_ctx.set_tag("source", "api")
return "result"
Example
import waxell_observe as waxell
@waxell.observe(agent_name="my-agent")
async def chat(query: str) -> str:
response = await openai_client.chat.completions.create(
model="gpt-4o",
messages=[{"role": "user", "content": query}],
) # auto-captured by instrumentation
waxell.score("helpfulness", 0.9)
waxell.tag("intent", "question")
return response.choices[0].message.content
# Creates a full run with LLM call, score, and tag — all auto-recorded
Behavior
- Async functions are wrapped with an async wrapper
- Sync functions are wrapped with a sync wrapper that uses asyncio.run() internally
- On success, the run is completed with status="success" and the captured return value
- On exception, the run is completed with status="error" and the error message; the exception is re-raised
@tool
from waxell_observe import tool
Decorator that auto-records function calls as tool invocations on the current WaxellContext.
Signature
@tool(name: str | None = None, tool_type: str = "function")
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | None | None | Tool name. Defaults to function name |
tool_type | str | "function" | Classification: "function", "vector_db", "database", "api" |
Captures: function arguments as input, return value as output, execution time, status ("ok" or "error"). Re-raises any exceptions. No-op outside a WaxellContext. Works with sync and async functions.
Example:
import waxell_observe as waxell
@waxell.tool(tool_type="vector_db")
def search_index(query_vec, k: int = 5):
distances, indices = index.search(query_vec, k)
return {"distances": distances.tolist(), "indices": indices.tolist()}
# Auto-records: tool_call(name="search_index", input={...}, output={...}, duration_ms=...)
@decision
from waxell_observe import decision
Decorator that auto-records a function's return value as a decision.
Signature
@decision(name: str | None = None, options: list[str] | None = None)
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | None | None | Decision name. Defaults to function name |
options | list[str] | None | None | Available choices |
Return value handling: a dict return has its chosen, reasoning, and confidence keys extracted; a string return is recorded as chosen.
Example:
import waxell_observe as waxell
@waxell.decision(name="route_query", options=["factual", "analytical", "creative"])
async def classify_query(query: str) -> dict:
response = await client.chat.completions.create(...)
return {"chosen": "factual", "reasoning": "Direct question", "confidence": 0.92}
# Dict return: extracts chosen, reasoning, confidence automatically
@retrieval
from waxell_observe import retrieval
Decorator that auto-records function calls as retrieval operations.
Signature
@retrieval(source: str = "", name: str | None = None)
| Parameter | Type | Default | Description |
|---|---|---|---|
source | str | "" | Data source name (e.g., "faiss", "pinecone") |
name | str | None | None | Override name. Defaults to function name |
Extracts query from the first string argument, documents from the return value, and scores from doc["score"] fields.
Example:
import waxell_observe as waxell
@waxell.retrieval(source="faiss")
def search_documents(query: str, corpus: list) -> list[dict]:
return [{"id": 1, "title": "Result", "score": 0.95}]
# Auto-extracts: query from first str arg, documents from return, scores from "score" keys
@reasoning_dec
from waxell_observe import reasoning_dec
Decorator that auto-records a function's return value as a reasoning step.
Signature
@reasoning_dec(step: str | None = None)
| Parameter | Type | Default | Description |
|---|---|---|---|
step | str | None | None | Reasoning step name. Defaults to function name |
Return value handling: a dict return has its thought, evidence, and conclusion keys extracted; a string return is recorded as thought.
Example:
import waxell_observe as waxell
@waxell.reasoning_dec(step="quality_check")
async def assess_answer(answer: str) -> dict:
return {"thought": "Answer covers sources", "evidence": ["A cited"], "conclusion": "High quality"}
# Dict return: extracts thought, evidence, conclusion
@retry_dec
from waxell_observe import retry_dec
Decorator that wraps a function with retry logic AND records each attempt.
Signature
@retry_dec(max_attempts: int = 3, strategy: str = "retry", fallback_to: str = "")
| Parameter | Type | Default | Description |
|---|---|---|---|
max_attempts | int | 3 | Maximum attempts (including first) |
strategy | str | "retry" | "retry", "fallback", or "circuit_break" |
fallback_to | str | "" | Fallback target name |
On each failure, records a retry span. After exhausting attempts, re-raises the last exception.
Example:
import waxell_observe as waxell
@waxell.retry_dec(max_attempts=3, strategy="fallback", fallback_to="gpt-4o-mini")
async def call_llm(prompt: str) -> str:
response = await client.chat.completions.create(model="gpt-4o", messages=[...])
return response.choices[0].message.content
# Retries up to 3 times, records each attempt as a retry span
@step_dec
from waxell_observe import step_dec
Decorator that auto-records function calls as execution steps.
Signature
@step_dec(name: str | None = None)
| Parameter | Type | Default | Description |
|---|---|---|---|
name | str | None | None | Step name. Defaults to function name |
Records the function's return value as the step output. No-op outside a WaxellContext.
Example:
import waxell_observe as waxell
@waxell.step_dec(name="preprocess")
def clean_input(text: str) -> dict:
cleaned = text.strip().lower()
return {"original": text, "cleaned": cleaned, "length": len(cleaned)}
# Return value becomes step output
WaxellLangChainHandler
from waxell_observe.integrations.langchain import WaxellLangChainHandler
Factory function that returns a LangChain BaseCallbackHandler instance.
Signature
WaxellLangChainHandler(
agent_name: str,
workflow_name: str = "default",
client: WaxellObserveClient | None = None,
enforce_policy: bool = True,
auto_start_run: bool = True,
) -> BaseCallbackHandler
| Parameter | Type | Default | Description |
|---|---|---|---|
agent_name | str | (required) | Agent name |
workflow_name | str | "default" | Workflow name |
client | WaxellObserveClient | None | None | Pre-configured client |
enforce_policy | bool | True | Check policies on first callback |
auto_start_run | bool | True | Automatically start a run on first callback |
Requires langchain-core. Install with pip install waxell-observe[langchain].
Instance Methods
flush
async flush(
result: dict | None = None,
status: str = "success",
error: str = "",
) -> None
Flush all buffered telemetry to the control plane and complete the run.
flush_sync
flush_sync(**kwargs) -> None
Synchronous version of flush. Accepts the same keyword arguments.
Instance Properties
| Property | Type | Description |
|---|---|---|
run_id | str | The run ID from the control plane, or "" if no run started |
Captured Callbacks
| Callback | Data Captured |
|---|---|
on_llm_start | Model name, prompt preview (500 chars) |
on_llm_end | Token counts, cost estimate, response preview (500 chars) |
on_chain_start | Chain name as a step |
on_chain_end | Chain output |
on_tool_start | Tool name as a step (prefixed tool:) |
on_tool_end | Tool output (1000 chars) |
Types
RunInfo
from waxell_observe import RunInfo
@dataclass
class RunInfo:
run_id: str
workflow_id: str
started_at: str
Information about a started execution run. Returned by WaxellObserveClient.start_run().
RunCompleteResult
from waxell_observe import RunCompleteResult
@dataclass
class RunCompleteResult:
run_id: str
duration: float | None = None
governance_action: str = "allow"
governance_reason: str = ""
retry_feedback: str = ""
max_retries: int = 0
@property
def should_retry(self) -> bool: ... # True if governance_action == "retry"
Result from completing a run, including governance info. Returned by WaxellObserveClient.complete_run().
| Field | Type | Default | Description |
|---|---|---|---|
run_id | str | (required) | The run ID |
duration | float | None | None | Run duration in seconds |
governance_action | str | "allow" | Post-execution governance action |
governance_reason | str | "" | Reason for governance action |
retry_feedback | str | "" | Feedback for retry attempts |
max_retries | int | 0 | Maximum retry attempts allowed |
PolicyCheckResult
from waxell_observe import PolicyCheckResult
@dataclass
class PolicyCheckResult:
action: str # "allow", "block", "warn", "throttle", "retry"
reason: str = ""
metadata: dict = field(default_factory=dict)
evaluations: list = field(default_factory=list)
@property
def allowed(self) -> bool: ... # True if action in ("allow", "warn")
@property
def blocked(self) -> bool: ... # True if action in ("block", "throttle")
@property
def should_retry(self) -> bool: ... # True if action == "retry"
Result of a policy check. Returned by WaxellObserveClient.check_policy() and WaxellContext.check_policy().
LlmCallInfo
from waxell_observe import LlmCallInfo
@dataclass
class LlmCallInfo:
model: str
tokens_in: int
tokens_out: int
cost: float = 0.0
task: str = ""
prompt_preview: str = ""
response_preview: str = ""
Typed representation of an LLM API call. Useful for constructing call records programmatically.
PromptInfo
from waxell_observe import PromptInfo
@dataclass
class PromptInfo:
name: str
version: int
prompt_type: str # "text" or "chat"
content: object # str for text, list[dict] for chat
config: dict = field(default_factory=dict)
labels: list = field(default_factory=list)
def compile(self, **variables: str) -> object: ...
A prompt version retrieved from the control plane. Returned by WaxellObserveClient.get_prompt().
| Field | Type | Description |
|---|---|---|
name | str | Prompt name |
version | int | Version number |
prompt_type | str | "text" for plain text prompts, "chat" for chat message prompts |
content | str | list[dict] | Prompt content. A string for text prompts, a list of {"role": ..., "content": ...} message dicts for chat prompts |
config | dict | Model configuration (e.g. temperature, max_tokens, model) |
labels | list[str] | Labels attached to this version (e.g. ["production", "latest"]) |
compile
prompt.compile(**variables: str) -> str | list[dict]
Render the prompt by replacing {{variable}} placeholders in the content.
- Text prompts: Returns a string with all {{variable}} placeholders replaced.
- Chat prompts: Returns a list of message dicts with {{variable}} placeholders replaced in each message's content field.
Example:
# Text prompt
prompt = await client.get_prompt("summarizer", label="production")
rendered = prompt.compile(topic="AI safety", length="short")
# rendered: "Summarize the following about AI safety in short form: ..."
# Chat prompt
prompt = await client.get_prompt("assistant", label="production")
messages = prompt.compile(user_query="What is RAG?")
# messages: [{"role": "system", "content": "..."}, {"role": "user", "content": "What is RAG?"}]
# Use config for model parameters
response = openai.chat.completions.create(
model=prompt.config.get("model", "gpt-4o"),
messages=messages,
temperature=prompt.config.get("temperature", 0.7),
)
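The substitution itself is plain string replacement. A hedged reference sketch of the documented behavior (compile_prompt is illustrative; the SDK's actual implementation may differ, e.g. in how it treats unmatched placeholders):

```python
def compile_prompt(prompt_type, content, **variables):
    """Sketch of PromptInfo.compile(): replace {{var}} placeholders.

    Text prompts return a rendered string; chat prompts return new message
    dicts with each message's content field rendered.
    """
    def render(text):
        for name, value in variables.items():
            text = text.replace("{{" + name + "}}", value)
        return text

    if prompt_type == "text":
        return render(content)
    return [{**msg, "content": render(msg["content"])} for msg in content]
```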
ObserveConfig
from waxell_observe import ObserveConfig
@dataclass
class ObserveConfig:
api_url: str = ""
api_key: str = ""
otel_endpoint: str = ""
debug: bool = False
capture_content: bool = False
prompt_guard: bool = False
prompt_guard_server: bool = False
prompt_guard_action: str = "block"
instrument_infra: bool = True
infra_exclude: str = ""
@classmethod
def from_env(cls) -> ObserveConfig: ...
@classmethod
def from_cli_config(cls, config_path: Path | None = None) -> ObserveConfig: ...
@property
def is_configured(self) -> bool: ...
Configuration data class. Used internally by WaxellObserveClient to resolve settings.
| Field | Type | Default | Description |
|---|---|---|---|
api_url | str | "" | Waxell API URL |
api_key | str | "" | Waxell API key |
otel_endpoint | str | "" | Explicit OTel collector endpoint |
debug | bool | False | Enable debug logging |
capture_content | bool | False | Include prompt/response content in traces |
prompt_guard | bool | False | Enable client-side prompt guard |
prompt_guard_server | bool | False | Enable server-side prompt guard |
prompt_guard_action | str | "block" | Action on violations: "block", "warn", or "redact" |
instrument_infra | bool | True | Enable infrastructure library instrumentation |
infra_exclude | str | "" | Comma-delimited list of infra libraries to exclude |
| Class Method | Description |
|---|---|
from_env() | Load from environment variables (WAXELL_API_URL/WAXELL_API_KEY or WAX_API_URL/WAX_API_KEY) |
from_cli_config(config_path=None) | Load from CLI config file (default: ~/.waxell/config) |
| Property | Type | Description |
|---|---|---|
is_configured | bool | True if both api_url and api_key are non-empty |
ApprovalDecision
from waxell_observe import ApprovalDecision
@dataclass
class ApprovalDecision:
approved: bool
approver: str = ""
timed_out: bool = False
elapsed_seconds: float | None = None
Return type from on_policy_block handlers. Tells the decorator whether to retry the function (approved=True) or propagate the PolicyViolationError.
| Field | Type | Default | Description |
|---|---|---|---|
approved | bool | required | Whether to proceed with execution |
approver | str | "" | Who approved (email, username, system) |
timed_out | bool | False | Whether the approval window expired |
elapsed_seconds | float | None | None | Time from block to decision |
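A custom handler just needs to return one of these. The sketch below assumes the handler receives the PolicyCheckResult that triggered the block -- that signature, _Approval, and approve_known_safe are all illustrative assumptions, not SDK symbols:

```python
from dataclasses import dataclass

@dataclass
class _Approval:
    """Local stand-in mirroring the documented ApprovalDecision fields."""
    approved: bool
    approver: str = ""
    timed_out: bool = False

def approve_known_safe(policy_result):
    """Hypothetical on_policy_block handler: approve blocks flagged only
    for rate limiting, deny everything else."""
    if "rate" in policy_result.reason.lower():
        return _Approval(approved=True, approver="ops-bot")
    return _Approval(approved=False)
```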
HumanTurn
from waxell_observe import HumanTurn
Context manager returned by waxell.human_turn(). Records a human interaction as a timed IO span when it exits.
| Method | Description |
|---|---|
set_response(response: str) | Record what the human replied |
__enter__() | Start timing |
__exit__() | Record the span with elapsed time |
Errors
All errors inherit from ObserveError, which inherits from Exception.
ObserveError
from waxell_observe import ObserveError
Base error class for all waxell-observe errors.
PolicyViolationError
from waxell_observe import PolicyViolationError
class PolicyViolationError(ObserveError):
def __init__(self, message: str, policy_result=None): ...
policy_result: PolicyCheckResult | None
Raised when a policy check blocks execution (action is "block" or "throttle").
| Attribute | Type | Description |
|---|---|---|
policy_result | PolicyCheckResult | None | The full policy check result |
ConfigurationError
from waxell_observe import ConfigurationError
Raised when the client is not properly configured. Inherits from ObserveError.
Functions
estimate_cost
from waxell_observe.cost import estimate_cost
estimate_cost(model: str, tokens_in: int, tokens_out: int) -> float
Estimate the USD cost of an LLM call. Uses exact match first, then prefix matching for versioned model names. Returns 0.0 for unknown models.
| Parameter | Type | Description |
|---|---|---|
model | str | Model name or prefix |
tokens_in | int | Input token count |
tokens_out | int | Output token count |
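The matching order can be illustrated with a toy price table. estimate_cost_sketch and the per-1M-token prices below are hypothetical -- the real table lives inside waxell_observe.cost:

```python
# Hypothetical (input, output) USD prices per 1M tokens, for illustration only
_PRICES = {
    "gpt-4o": (2.50, 10.00),
    "gpt-4o-mini": (0.15, 0.60),
}

def estimate_cost_sketch(model, tokens_in, tokens_out):
    """Illustrates the documented lookup: exact match first, then the longest
    matching prefix (for versioned model names), else 0.0 for unknown models."""
    rate = _PRICES.get(model)
    if rate is None:
        for prefix in sorted(_PRICES, key=len, reverse=True):
            if model.startswith(prefix):
                rate = _PRICES[prefix]
                break
    if rate is None:
        return 0.0
    return (tokens_in * rate[0] + tokens_out * rate[1]) / 1_000_000
```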
Configuration Resolution
The SDK resolves configuration from multiple sources, in order of precedence (highest to lowest):
- Explicit constructor arguments -- WaxellObserveClient(api_url="...", api_key="...")
- Global config -- WaxellObserveClient.configure(...) or waxell_observe.init(...)
- CLI config file -- ~/.waxell/config (INI format)
- Environment variables -- WAXELL_API_URL/WAXELL_API_KEY (or WAX_API_URL/WAX_API_KEY)
Environment variables:
| Variable | Description |
|---|---|
WAXELL_API_URL | Control plane URL (e.g. https://acme.waxell.dev) |
WAXELL_API_KEY | API key (e.g. wax_sk_abc123) |
WAX_API_URL | Alias for WAXELL_API_URL |
WAX_API_KEY | Alias for WAXELL_API_KEY |
WAXELL_OBSERVE | Kill switch. Set to false, 0, or no to disable init() |
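The precedence chain amounts to taking the first non-empty value across the four sources. A sketch, with resolve as an illustrative helper (not an SDK function):

```python
def resolve(name, *, explicit="", global_cfg=None, cli_cfg=None, env=None):
    """Sketch of the documented precedence: explicit arg > global config >
    CLI config file > environment (WAXELL_* with WAX_* as an alias)."""
    global_cfg = global_cfg or {}
    cli_cfg = cli_cfg or {}
    env = env or {}
    env_value = (env.get("WAXELL_" + name.upper(), "")
                 or env.get("WAX_" + name.upper(), ""))
    for value in (explicit, global_cfg.get(name, ""),
                  cli_cfg.get(name, ""), env_value):
        if value:
            return value
    return ""
```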
Next Steps
- REST API Reference -- Direct HTTP API usage
- Quickstart -- Get started in 5 minutes
- Installation & Configuration -- Setup guide