harness-python-react/tests/test_otel_semconv.py at 1a32080b9595ea5adc7040f43f7bb71e366ecafc · constk/harness-python-react · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
"""Assertions that emitted spans use OTel semantic-convention attribute names.

Test-side enforcement of the rule "use the official OTel semconv attribute
names where one exists" (see `src/observability/spans.py` and
`docs/INVARIANTS.md`).

The scaffold ships only semconv-defined keys (no custom ones); the
`ALLOWED_CUSTOM_KEYS` set below is intentionally empty. When a project
that extends this template needs a custom attribute (e.g.
`agent.tool_calls_count`), it MUST add a constant to
`src/observability/spans.py` AND register it in `ALLOWED_CUSTOM_KEYS` —
the registry-closure test fails otherwise. That's the forcing function
that keeps custom keys to their documented set rather than letting them
proliferate as one-off raw strings.
"""

from __future__ import annotations

from typing import TYPE_CHECKING

import pytest
from opentelemetry import trace
from opentelemetry.sdk.trace import TracerProvider
from opentelemetry.sdk.trace.export import SimpleSpanProcessor
from opentelemetry.sdk.trace.export.in_memory_span_exporter import (
    InMemorySpanExporter,
)

from src.observability import spans as spans_module
from src.observability.spans import (
    DB_QUERY_TEXT,
    DB_RESPONSE_RETURNED_ROWS,
    GENAI_CONVERSATION_ID,
    GENAI_OPERATION_NAME,
    GENAI_PROVIDER_NAME,
    GENAI_REQUEST_MODEL,
    GENAI_TOOL_CALL_ARGUMENTS,
    GENAI_TOOL_CALL_RESULT,
    GENAI_TOOL_NAME,
    GENAI_USAGE_INPUT_TOKENS,
    GENAI_USAGE_OUTPUT_TOKENS,
    agent_span,
)

if TYPE_CHECKING:
    from collections.abc import Sequence

    from opentelemetry.sdk.trace import ReadableSpan


SEMCONV_KEYS: frozenset[str] = frozenset(
    {
        GENAI_CONVERSATION_ID,
        GENAI_REQUEST_MODEL,
        GENAI_OPERATION_NAME,
        GENAI_PROVIDER_NAME,
        GENAI_USAGE_INPUT_TOKENS,
        GENAI_USAGE_OUTPUT_TOKENS,
        GENAI_TOOL_NAME,
        GENAI_TOOL_CALL_ARGUMENTS,
        GENAI_TOOL_CALL_RESULT,
        DB_QUERY_TEXT,
        DB_RESPONSE_RETURNED_ROWS,
    }
)

# Custom keys allowed because no semconv equivalent exists. Empty in the
# scaffold — projects that extend this template add entries here as they
# add custom span attributes (and constants in `src/observability/spans.py`).
ALLOWED_CUSTOM_KEYS: frozenset[str] = frozenset()

ACCEPTED_KEYS: frozenset[str] = SEMCONV_KEYS | ALLOWED_CUSTOM_KEYS


@pytest.fixture
def memory_exporter(monkeypatch: pytest.MonkeyPatch) -> InMemorySpanExporter:
    """Install a TracerProvider that records spans into an in-memory exporter.

    Uses `monkeypatch.setattr` to swap `trace.get_tracer_provider` for the
    test's lifetime instead of `trace.set_tracer_provider` — the OTel SDK
    refuses to override the global provider once any other test has called
    `set_tracer_provider`, which would silently route spans to the wrong
    exporter.

    Uses `SimpleSpanProcessor` so spans are visible to `get_finished_spans()`
    immediately after the span context exits — no flush race.
    """
    exporter = InMemorySpanExporter()
    provider = TracerProvider()
    provider.add_span_processor(SimpleSpanProcessor(exporter))
    monkeypatch.setattr(trace, "get_tracer_provider", lambda: provider)
    return exporter


def _span_by_name(spans: Sequence[ReadableSpan], name: str) -> ReadableSpan:
    """Return the unique span with the given name (assert exactly one)."""
    matches = [s for s in spans if s.name == name]
    assert len(matches) == 1, (
        f"expected exactly one span named {name!r}, got {len(matches)} "
        f"(all names: {[s.name for s in spans]})"
    )
    return matches[0]


def test_tool_call_span_carries_genai_tool_attributes(
    memory_exporter: InMemorySpanExporter,
) -> None:
    """A tool-call span carries the documented `gen_ai.tool.*` keys."""
    tool_attrs: dict[str, str | int] = {
        GENAI_TOOL_NAME: "echo",
        GENAI_TOOL_CALL_ARGUMENTS: '{"msg": "hi"}',
        GENAI_TOOL_CALL_RESULT: '{"echoed": "hi"}',
    }
    with agent_span("tool.echo", tool_attrs):
        pass

    spans = memory_exporter.get_finished_spans()
    tool_span = _span_by_name(spans, "tool.echo")
    assert tool_span.attributes is not None
    keys = set(tool_span.attributes)

    assert GENAI_TOOL_NAME in keys
    assert GENAI_TOOL_CALL_ARGUMENTS in keys
    assert GENAI_TOOL_CALL_RESULT in keys
    assert tool_span.attributes[GENAI_TOOL_NAME] == "echo"


def test_llm_call_span_carries_genai_attributes(
    memory_exporter: InMemorySpanExporter,
) -> None:
    """An LLM-style span carries the documented `gen_ai.*` keys + token usage."""
    llm_attrs: dict[str, str | int] = {
        GENAI_CONVERSATION_ID: "session-test-1",
        GENAI_REQUEST_MODEL: "gpt-4o-mini",
        GENAI_OPERATION_NAME: "chat",
        GENAI_PROVIDER_NAME: "openai",
        GENAI_USAGE_INPUT_TOKENS: 42,
        GENAI_USAGE_OUTPUT_TOKENS: 100,
    }
    with agent_span("agent.llm_call", llm_attrs):
        pass

    spans = memory_exporter.get_finished_spans()
    llm_span = _span_by_name(spans, "agent.llm_call")
    assert llm_span.attributes is not None

    for key, value in llm_attrs.items():
        assert key in llm_span.attributes, f"missing {key}"
        assert llm_span.attributes[key] == value


def test_db_query_span_carries_db_attributes(
    memory_exporter: InMemorySpanExporter,
) -> None:
    """A DB-query span carries `db.query.text` + `db.response.returned_rows`."""
    db_attrs: dict[str, str | int] = {
        DB_QUERY_TEXT: "SELECT 1",
        DB_RESPONSE_RETURNED_ROWS: 1,
    }
    with agent_span("db.example_query", db_attrs):
        pass

    spans = memory_exporter.get_finished_spans()
    db_span = _span_by_name(spans, "db.example_query")
    assert db_span.attributes is not None
    keys = set(db_span.attributes)

    assert DB_QUERY_TEXT in keys
    assert DB_RESPONSE_RETURNED_ROWS in keys


def test_no_unregistered_attribute_keys_emitted(
    memory_exporter: InMemorySpanExporter,
) -> None:
    """Every emitted attribute key is in `SEMCONV_KEYS` or `ALLOWED_CUSTOM_KEYS`."""
    with agent_span(
        "tool.echo",
        {
            GENAI_TOOL_NAME: "echo",
            GENAI_TOOL_CALL_ARGUMENTS: "{}",
            GENAI_TOOL_CALL_RESULT: "{}",
        },
    ):
        pass

    spans = memory_exporter.get_finished_spans()

    rogue: list[tuple[str, str]] = []
    for span in spans:
        if span.attributes is None:
            continue
        for key in span.attributes:
            if key not in ACCEPTED_KEYS:
                rogue.append((span.name, key))

    assert not rogue, (
        "Span attributes emitted with keys outside the documented registry: "
        f"{rogue}. Either use a semconv name from `src/observability/spans.py` "
        "or add the new key to both `spans.py` (with a comment explaining why "
        "no semconv equivalent applies) and `ALLOWED_CUSTOM_KEYS` in this test."
    )


def test_spans_module_constants_are_registered() -> None:
    """Every uppercase `str` constant in `spans.py` belongs to the test allowlist.

    The allowlist is `SEMCONV_KEYS | ALLOWED_CUSTOM_KEYS`. Catches the
    "added a new constant in `spans.py` without updating the test" drift class.
    If this fails, either:

    - the new constant is a semconv name → add it to `SEMCONV_KEYS`.
    - the new constant is a custom name → add it to `ALLOWED_CUSTOM_KEYS`
      AND ensure the comment in `spans.py` explains why no semconv applies.
    """
    declared = {
        getattr(spans_module, name)
        for name in dir(spans_module)
        if name.isupper() and isinstance(getattr(spans_module, name), str)
    }
    unregistered = declared - ACCEPTED_KEYS
    assert not unregistered, (
        f"`spans.py` defines constants not in the test allowlist: "
        f"{sorted(unregistered)!r}. Update `SEMCONV_KEYS` or "
        "`ALLOWED_CUSTOM_KEYS` in this test."
    )