57 changes: 51 additions & 6 deletions logfire/_internal/integrations/llm_providers/anthropic.py
@@ -1,12 +1,23 @@
from __future__ import annotations

-from typing import TYPE_CHECKING, Any
+import json
+from typing import TYPE_CHECKING, Any, cast

import anthropic
from anthropic.types import Message, TextBlock, TextDelta

from logfire._internal.utils import handle_internal_errors

+from .semconv import (
+    OPERATION_NAME,
+    PROVIDER_NAME,
+    REQUEST_MAX_TOKENS,
+    REQUEST_STOP_SEQUENCES,
+    REQUEST_TEMPERATURE,
+    REQUEST_TOP_K,
+    REQUEST_TOP_P,
+    TOOL_DEFINITIONS,
+)
from .types import EndpointConfig, StreamState

if TYPE_CHECKING:
@@ -22,24 +33,58 @@
    )


+def _extract_request_parameters(json_data: dict[str, Any], span_data: dict[str, Any]) -> None:
+    """Extract request parameters from json_data and add to span_data."""
+    if (max_tokens := json_data.get('max_tokens')) is not None:
+        span_data[REQUEST_MAX_TOKENS] = max_tokens
+
+    if (temperature := json_data.get('temperature')) is not None:
+        span_data[REQUEST_TEMPERATURE] = temperature
+
+    if (top_p := json_data.get('top_p')) is not None:
+        span_data[REQUEST_TOP_P] = top_p
+
+    if (top_k := json_data.get('top_k')) is not None:
+        span_data[REQUEST_TOP_K] = top_k
+
+    if (stop_sequences := json_data.get('stop_sequences')) is not None:
+        span_data[REQUEST_STOP_SEQUENCES] = json.dumps(stop_sequences)
+
+    if (tools := json_data.get('tools')) is not None:
+        span_data[TOOL_DEFINITIONS] = json.dumps(tools)
+
+
def get_endpoint_config(options: FinalRequestOptions) -> EndpointConfig:
    """Returns the endpoint config for Anthropic or Bedrock depending on the url."""
    url = options.url
-    json_data = options.json_data
-    if not isinstance(json_data, dict):  # pragma: no cover
+    raw_json_data = options.json_data
+    if not isinstance(raw_json_data, dict):  # pragma: no cover
        # Ensure that `{request_data[model]!r}` doesn't raise an error, just a warning about `model` missing.
-        json_data = {}
+        raw_json_data = {}
+    json_data = cast('dict[str, Any]', raw_json_data)
Collaborator: is this raw_json_data variable needed just to deal with pyright quirks?

Contributor Author: pyright quirks, please advise
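
A plausible reading of the pyright issue (an inference; the thread does not spell it out): `options.json_data` has a broad declared type, and `isinstance(raw_json_data, dict)` only narrows it to an unparameterized `dict`, which pyright's strict mode treats as `dict[Unknown, Unknown]` and flags once keys are read. Keeping the broad value under the separate `raw_json_data` name and casting once hands the rest of the function a clean `dict[str, Any]`. A minimal sketch of the pattern (the `_as_str_dict` helper is hypothetical):

    from typing import Any, cast

    def _as_str_dict(raw: object) -> dict[str, Any]:
        # isinstance() alone narrows `raw` to an unparameterized dict, which
        # pyright's strict mode flags when keys are accessed; the explicit
        # cast pins the key/value types.
        if not isinstance(raw, dict):
            raw = {}
        return cast('dict[str, Any]', raw)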


    if url == '/v1/messages':
+        span_data: dict[str, Any] = {
+            'request_data': json_data,
+            PROVIDER_NAME: 'anthropic',
+            OPERATION_NAME: 'chat',
+        }
+        _extract_request_parameters(json_data, span_data)
+
        return EndpointConfig(
            message_template='Message with {request_data[model]!r}',
-            span_data={'request_data': json_data},
+            span_data=span_data,
            stream_state_cls=AnthropicMessageStreamState,
        )
    else:
+        span_data = {
+            'request_data': json_data,
+            'url': url,
+            PROVIDER_NAME: 'anthropic',
+        }
        return EndpointConfig(
            message_template='Anthropic API call to {url!r}',
-            span_data={'request_data': json_data, 'url': url},
+            span_data=span_data,
        )


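To make the net effect of the anthropic.py changes concrete, here is a sketch of the attributes the new helper adds for a /v1/messages call (the payload values are invented for illustration):

    request = {
        'model': 'claude-3-5-sonnet-latest',  # hypothetical model name
        'max_tokens': 1024,
        'temperature': 0.5,
        'stop_sequences': ['\n\nHuman:'],
    }
    span_data = {
        'request_data': request,
        'gen_ai.provider.name': 'anthropic',
        'gen_ai.operation.name': 'chat',
    }
    _extract_request_parameters(request, span_data)
    # span_data now also contains:
    #   'gen_ai.request.max_tokens': 1024
    #   'gen_ai.request.temperature': 0.5
    #   'gen_ai.request.stop_sequences': '["\\n\\nHuman:"]'
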
6 changes: 4 additions & 2 deletions logfire/_internal/integrations/llm_providers/llm_provider.py
@@ -4,6 +4,8 @@
from contextlib import AbstractContextManager, ExitStack, contextmanager, nullcontext
from typing import TYPE_CHECKING, Any, Callable, cast

+from opentelemetry.trace import SpanKind
+
from logfire import attach_context, get_context
from logfire.propagate import ContextCarrier

@@ -136,7 +138,7 @@ def instrumented_llm_request_sync(*args: Any, **kwargs: Any) -> Any:
    message_template, span_data, kwargs = _instrumentation_setup(*args, **kwargs)
    if message_template is None:
        return original_request_method(*args, **kwargs)
-    with logfire_llm.span(message_template, **span_data) as span:
+    with logfire_llm.span(message_template, _span_kind=SpanKind.CLIENT, **span_data) as span:
        with maybe_suppress_instrumentation(suppress_otel):
            if kwargs.get('stream'):
                return original_request_method(*args, **kwargs)
@@ -148,7 +150,7 @@ async def instrumented_llm_request_async(*args: Any, **kwargs: Any) -> Any:
    message_template, span_data, kwargs = _instrumentation_setup(*args, **kwargs)
    if message_template is None:
        return await original_request_method(*args, **kwargs)
-    with logfire_llm.span(message_template, **span_data) as span:
+    with logfire_llm.span(message_template, _span_kind=SpanKind.CLIENT, **span_data) as span:
        with maybe_suppress_instrumentation(suppress_otel):
            if kwargs.get('stream'):
                return await original_request_method(*args, **kwargs)
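
The only functional change in this file is tagging each LLM request span as an OpenTelemetry CLIENT span, the span kind the conventions use for an outbound remote call. For reference, the same idea expressed with the plain OpenTelemetry API (a sketch; the tracer name is illustrative):

    from opentelemetry import trace
    from opentelemetry.trace import SpanKind

    tracer = trace.get_tracer('llm-example')
    with tracer.start_as_current_span('Chat Completion', kind=SpanKind.CLIENT):
        ...  # the outbound HTTP request to the LLM provider happens here
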
113 changes: 98 additions & 15 deletions logfire/_internal/integrations/llm_providers/openai.py
@@ -18,6 +18,19 @@
from logfire import LogfireSpan

from ...utils import handle_internal_errors, log_internal_error
+from .semconv import (
+    OPERATION_NAME,
+    PROVIDER_NAME,
+    REQUEST_FREQUENCY_PENALTY,
+    REQUEST_MAX_TOKENS,
+    REQUEST_MODEL,
+    REQUEST_PRESENCE_PENALTY,
+    REQUEST_SEED,
+    REQUEST_STOP_SEQUENCES,
+    REQUEST_TEMPERATURE,
+    REQUEST_TOP_P,
+    TOOL_DEFINITIONS,
+)
from .types import EndpointConfig, StreamState

if TYPE_CHECKING:
@@ -33,63 +46,133 @@
    )


+def _extract_request_parameters(json_data: dict[str, Any], span_data: dict[str, Any]) -> None:
+    """Extract request parameters from json_data and add to span_data."""
+    if (max_tokens := json_data.get('max_tokens')) is not None:
+        span_data[REQUEST_MAX_TOKENS] = max_tokens
+    elif (max_output_tokens := json_data.get('max_output_tokens')) is not None:
+        span_data[REQUEST_MAX_TOKENS] = max_output_tokens
+
+    if (temperature := json_data.get('temperature')) is not None:
+        span_data[REQUEST_TEMPERATURE] = temperature
+
+    if (top_p := json_data.get('top_p')) is not None:
+        span_data[REQUEST_TOP_P] = top_p
+
+    if (stop := json_data.get('stop')) is not None:
+        if isinstance(stop, str):
+            span_data[REQUEST_STOP_SEQUENCES] = json.dumps([stop])
+        else:
+            span_data[REQUEST_STOP_SEQUENCES] = json.dumps(stop)
+
+    if (seed := json_data.get('seed')) is not None:
+        span_data[REQUEST_SEED] = seed
+
+    if (frequency_penalty := json_data.get('frequency_penalty')) is not None:
+        span_data[REQUEST_FREQUENCY_PENALTY] = frequency_penalty
+
+    if (presence_penalty := json_data.get('presence_penalty')) is not None:
+        span_data[REQUEST_PRESENCE_PENALTY] = presence_penalty
+
+    if (tools := json_data.get('tools')) is not None:
+        span_data[TOOL_DEFINITIONS] = json.dumps(tools)
+
+
def get_endpoint_config(options: FinalRequestOptions) -> EndpointConfig:
    """Returns the endpoint config for OpenAI depending on the url."""
    url = options.url

-    json_data = options.json_data
-    if not isinstance(json_data, dict):  # pragma: no cover
+    raw_json_data = options.json_data
+    if not isinstance(raw_json_data, dict):  # pragma: no cover
        # Ensure that `{request_data[model]!r}` doesn't raise an error, just a warning about `model` missing.
-        json_data = {}
+        raw_json_data = {}
+    json_data = cast('dict[str, Any]', raw_json_data)

    if url == '/chat/completions':
        if is_current_agent_span('Chat completion with {gen_ai.request.model!r}'):
            return EndpointConfig(message_template='', span_data={})

+        span_data: dict[str, Any] = {
+            'request_data': json_data,
+            'gen_ai.request.model': json_data.get('model'),
+            PROVIDER_NAME: 'openai',
+            OPERATION_NAME: 'chat',
+        }
+        _extract_request_parameters(json_data, span_data)
+
        return EndpointConfig(
            message_template='Chat Completion with {request_data[model]!r}',
-            span_data={'request_data': json_data, 'gen_ai.request.model': json_data['model']},
+            span_data=span_data,
            stream_state_cls=OpenaiChatCompletionStreamState,
        )
    elif url == '/responses':
        if is_current_agent_span('Responses API', 'Responses API with {gen_ai.request.model!r}'):
            return EndpointConfig(message_template='', span_data={})

-        stream = json_data.get('stream', False)  # type: ignore
-        span_data: dict[str, Any] = {
-            'gen_ai.request.model': json_data['model'],
-            'request_data': {'model': json_data['model'], 'stream': stream},
+        stream = json_data.get('stream', False)
+        span_data = {
+            'gen_ai.request.model': json_data.get('model'),
+            'request_data': {'model': json_data.get('model'), 'stream': stream},
            'events': inputs_to_events(
-                json_data['input'],  # type: ignore
-                json_data.get('instructions'),  # type: ignore
+                json_data.get('input'),
+                json_data.get('instructions'),
            ),
+            PROVIDER_NAME: 'openai',
+            OPERATION_NAME: 'chat',
        }
+        _extract_request_parameters(json_data, span_data)

        return EndpointConfig(
            message_template='Responses API with {gen_ai.request.model!r}',
            span_data=span_data,
            stream_state_cls=OpenaiResponsesStreamState,
        )
    elif url == '/completions':
+        span_data = {
+            'request_data': json_data,
+            'gen_ai.request.model': json_data.get('model'),
+            PROVIDER_NAME: 'openai',
+            OPERATION_NAME: 'text_completion',
+        }
+        _extract_request_parameters(json_data, span_data)
        return EndpointConfig(
            message_template='Completion with {request_data[model]!r}',
-            span_data={'request_data': json_data, 'gen_ai.request.model': json_data['model']},
+            span_data=span_data,
            stream_state_cls=OpenaiCompletionStreamState,
        )
    elif url == '/embeddings':
+        span_data = {
+            'request_data': json_data,
+            'gen_ai.request.model': json_data.get('model'),
+            PROVIDER_NAME: 'openai',
+            OPERATION_NAME: 'embeddings',
+        }
+        _extract_request_parameters(json_data, span_data)
        return EndpointConfig(
            message_template='Embedding Creation with {request_data[model]!r}',
-            span_data={'request_data': json_data, 'gen_ai.request.model': json_data['model']},
+            span_data=span_data,
        )
    elif url == '/images/generations':
+        span_data = {
+            'request_data': json_data,
+            'gen_ai.request.model': json_data.get('model'),
+            PROVIDER_NAME: 'openai',
+            OPERATION_NAME: 'image_generation',
+        }
+        _extract_request_parameters(json_data, span_data)
        return EndpointConfig(
            message_template='Image Generation with {request_data[model]!r}',
-            span_data={'request_data': json_data, 'gen_ai.request.model': json_data['model']},
+            span_data=span_data,
        )
    else:
-        span_data = {'request_data': json_data, 'url': url}
+        span_data = {
+            'request_data': json_data,
+            'url': url,
+            PROVIDER_NAME: 'openai',
+        }
        if 'model' in json_data:
-            span_data['gen_ai.request.model'] = json_data['model']
+            span_data[REQUEST_MODEL] = json_data['model']
+        _extract_request_parameters(json_data, span_data)
        return EndpointConfig(
            message_template='OpenAI API call to {url!r}',
            span_data=span_data,
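
One detail worth calling out in the OpenAI version of _extract_request_parameters: `stop` may arrive as a single string or a list of strings, and both forms are normalized to a JSON array under gen_ai.request.stop_sequences, while `max_tokens` and the Responses API's `max_output_tokens` both map to gen_ai.request.max_tokens. A sketch with invented values:

    span_data = {}
    _extract_request_parameters({'stop': 'END', 'max_output_tokens': 256}, span_data)
    # span_data == {
    #     'gen_ai.request.max_tokens': 256,
    #     'gen_ai.request.stop_sequences': '["END"]',
    # }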
44 changes: 44 additions & 0 deletions logfire/_internal/integrations/llm_providers/semconv.py
@@ -0,0 +1,44 @@
"""Gen AI Semantic Convention attribute names.

These constants follow the OpenTelemetry Gen AI Semantic Conventions.
See: https://opentelemetry.io/docs/specs/semconv/gen-ai/
"""

from __future__ import annotations

# Provider and operation
PROVIDER_NAME = 'gen_ai.provider.name'
OPERATION_NAME = 'gen_ai.operation.name'

# Model information
REQUEST_MODEL = 'gen_ai.request.model'
RESPONSE_MODEL = 'gen_ai.response.model'

# Request parameters
REQUEST_MAX_TOKENS = 'gen_ai.request.max_tokens'
REQUEST_TEMPERATURE = 'gen_ai.request.temperature'
REQUEST_TOP_P = 'gen_ai.request.top_p'
REQUEST_TOP_K = 'gen_ai.request.top_k'
REQUEST_STOP_SEQUENCES = 'gen_ai.request.stop_sequences'
REQUEST_SEED = 'gen_ai.request.seed'
REQUEST_FREQUENCY_PENALTY = 'gen_ai.request.frequency_penalty'
REQUEST_PRESENCE_PENALTY = 'gen_ai.request.presence_penalty'

# Response metadata
RESPONSE_ID = 'gen_ai.response.id'
RESPONSE_FINISH_REASONS = 'gen_ai.response.finish_reasons'

# Token usage
INPUT_TOKENS = 'gen_ai.usage.input_tokens'
OUTPUT_TOKENS = 'gen_ai.usage.output_tokens'

# Message content
INPUT_MESSAGES = 'gen_ai.input.messages'
OUTPUT_MESSAGES = 'gen_ai.output.messages'
SYSTEM_INSTRUCTIONS = 'gen_ai.system_instructions'

# Tool definitions
TOOL_DEFINITIONS = 'gen_ai.tool.definitions'

# Conversation tracking
CONVERSATION_ID = 'gen_ai.conversation.id'
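
As a usage sketch (hypothetical consumer code, not part of this file), integrations import these constants rather than hard-coding attribute strings, so a typo surfaces as an ImportError instead of a silently wrong attribute name:

    from logfire._internal.integrations.llm_providers.semconv import (
        OPERATION_NAME,
        PROVIDER_NAME,
        REQUEST_TEMPERATURE,
    )

    span_data = {
        PROVIDER_NAME: 'openai',  # 'gen_ai.provider.name'
        OPERATION_NAME: 'chat',  # 'gen_ai.operation.name'
        REQUEST_TEMPERATURE: 0.2,  # 'gen_ai.request.temperature'
    }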