159 lines
4.8 KiB
Python
159 lines
4.8 KiB
Python
import json
|
|
import logging
|
|
from dataclasses import asdict
|
|
from enum import Enum
|
|
from typing import Union
|
|
|
|
from opentelemetry._logs import Logger, LogRecord
|
|
from opentelemetry.instrumentation.sagemaker.event_models import (
|
|
ChoiceEvent,
|
|
MessageEvent,
|
|
)
|
|
from opentelemetry.instrumentation.sagemaker.reusable_streaming_body import (
|
|
ReusableStreamingBody,
|
|
)
|
|
from opentelemetry.instrumentation.sagemaker.streaming_wrapper import StreamingWrapper
|
|
from opentelemetry.instrumentation.sagemaker.utils import (
|
|
should_emit_events,
|
|
should_send_prompts,
|
|
)
|
|
from opentelemetry.semconv._incubating.attributes import (
|
|
gen_ai_attributes as GenAIAttributes,
|
|
)
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class Roles(Enum):
|
|
USER = "user"
|
|
ASSISTANT = "assistant"
|
|
SYSTEM = "system"
|
|
TOOL = "tool"
|
|
|
|
|
|
VALID_MESSAGE_ROLES = {role.value for role in Roles}
|
|
"""The valid roles for naming the message event."""
|
|
|
|
EVENT_ATTRIBUTES = {GenAIAttributes.GEN_AI_SYSTEM: "sagemaker"}
|
|
"""The attributes to be used for the event."""
|
|
|
|
|
|
def emit_message_event(kwargs, event_logger):
|
|
try:
|
|
input_body = json.loads(kwargs.get("Body"))
|
|
except json.JSONDecodeError:
|
|
logger.debug(
|
|
"OpenTelemetry failed to decode the request body, error: %s",
|
|
kwargs.get("Body"),
|
|
)
|
|
return
|
|
emit_event(
|
|
MessageEvent(content=input_body.get("inputs", ""), role="user"), event_logger
|
|
)
|
|
|
|
|
|
def emit_choice_events(response: dict, event_logger):
|
|
response_body: Union[StreamingWrapper, ReusableStreamingBody, None] = response.get(
|
|
"Body"
|
|
)
|
|
|
|
if isinstance(response_body, StreamingWrapper):
|
|
emit_event(
|
|
ChoiceEvent(
|
|
index=0,
|
|
message={
|
|
"content": response_body.accumulating_body,
|
|
"role": "assistant",
|
|
},
|
|
finish_reason="unknown",
|
|
),
|
|
event_logger,
|
|
)
|
|
elif isinstance(response_body, ReusableStreamingBody):
|
|
for i, gen in enumerate(json.loads(response_body.read())):
|
|
emit_event(
|
|
ChoiceEvent(
|
|
index=i,
|
|
message={"content": gen.get("generated_text"), "role": "assistant"},
|
|
finish_reason="unknown",
|
|
),
|
|
event_logger,
|
|
)
|
|
|
|
|
|
def emit_event(
|
|
event: Union[MessageEvent, ChoiceEvent], event_logger: Union[Logger, None]
|
|
) -> None:
|
|
"""
|
|
Emit an event to the OpenTelemetry SDK.
|
|
|
|
Args:
|
|
event: The event to emit.
|
|
"""
|
|
if not should_emit_events() or event_logger is None:
|
|
return
|
|
|
|
if isinstance(event, MessageEvent):
|
|
_emit_message_event(event, event_logger)
|
|
elif isinstance(event, ChoiceEvent):
|
|
_emit_choice_event(event, event_logger)
|
|
else:
|
|
raise TypeError("Unsupported event type")
|
|
|
|
|
|
def _emit_message_event(event: MessageEvent, event_logger: Logger) -> None:
|
|
body = asdict(event)
|
|
|
|
if event.role in VALID_MESSAGE_ROLES:
|
|
name = "gen_ai.{}.message".format(event.role)
|
|
# According to the semantic conventions, the role is conditionally required if available
|
|
# and not equal to the "role" in the message name. So, remove the role from the body if
|
|
# it is the same as the in the event name.
|
|
body.pop("role", None)
|
|
else:
|
|
name = "gen_ai.user.message"
|
|
|
|
# According to the semantic conventions, only the assistant role has tool call
|
|
if event.role != Roles.ASSISTANT.value and event.tool_calls is not None:
|
|
del body["tool_calls"]
|
|
elif event.tool_calls is None:
|
|
del body["tool_calls"]
|
|
|
|
if not should_send_prompts():
|
|
del body["content"]
|
|
if body.get("tool_calls") is not None:
|
|
for tool_call in body["tool_calls"]:
|
|
tool_call["function"].pop("arguments", None)
|
|
|
|
log_record = LogRecord(
|
|
body=body,
|
|
attributes=EVENT_ATTRIBUTES,
|
|
event_name=name
|
|
)
|
|
event_logger.emit(log_record)
|
|
|
|
|
|
def _emit_choice_event(event: ChoiceEvent, event_logger: Logger) -> None:
|
|
body = asdict(event)
|
|
if event.message["role"] == Roles.ASSISTANT.value:
|
|
# According to the semantic conventions, the role is conditionally required if available
|
|
# and not equal to "assistant", so remove the role from the body if it is "assistant".
|
|
body["message"].pop("role", None)
|
|
|
|
if event.tool_calls is None:
|
|
del body["tool_calls"]
|
|
|
|
if not should_send_prompts():
|
|
body["message"].pop("content", None)
|
|
if body.get("tool_calls") is not None:
|
|
for tool_call in body["tool_calls"]:
|
|
tool_call["function"].pop("arguments", None)
|
|
|
|
log_record = LogRecord(
|
|
body=body,
|
|
attributes=EVENT_ATTRIBUTES,
|
|
event_name="gen_ai.choice"
|
|
|
|
)
|
|
event_logger.emit(log_record)
|