
Commit 463fd1e

feat(openai): standardize completions to indexed attribute format
Signed-off-by: Adrian Cole <[email protected]>
1 parent: b827f3d

9 files changed: +177 -10 lines changed


python/instrumentation/openinference-instrumentation-openai/src/openinference/instrumentation/openai/_request_attributes_extractor.py

Lines changed: 5 additions & 2 deletions

@@ -32,6 +32,8 @@
 
 # TODO: Update to use SpanAttributes.EMBEDDING_INVOCATION_PARAMETERS when released in semconv
 _EMBEDDING_INVOCATION_PARAMETERS = "embedding.invocation_parameters"
+# TODO: Update to use SpanAttributes.LLM_INPUT_PROMPTS when released in semconv
+_LLM_INPUT_PROMPTS = "llm.input_prompts"
 
 if TYPE_CHECKING:
     from openai.types import Completion, CreateEmbeddingResponse

@@ -226,13 +228,14 @@ def _get_attributes_from_completion_create_param(
 
     model_prompt = params.get("prompt")
     if isinstance(model_prompt, str):
-        yield SpanAttributes.LLM_PROMPTS, [model_prompt]
+        yield f"{_LLM_INPUT_PROMPTS}.0", model_prompt
     elif (
         isinstance(model_prompt, list)
         and model_prompt
        and all(isinstance(item, str) for item in model_prompt)
     ):
-        yield SpanAttributes.LLM_PROMPTS, model_prompt
+        for index, prompt in enumerate(model_prompt):
+            yield f"{_LLM_INPUT_PROMPTS}.{index}", prompt
 
 
 def _get_attributes_from_embedding_create_param(
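
To illustrate the new behavior (an example, not part of the diff): a prompt list no longer becomes a single list-valued llm.prompts attribute; each element gets its own indexed key. A minimal sketch with hypothetical prompt strings:

    # Hypothetical request params; the attribute keys follow the diff above.
    params = {"prompt": ["What is 1+1?", "What is 2+2?"]}
    # _get_attributes_from_completion_create_param(params) now yields:
    #   ("llm.input_prompts.0", "What is 1+1?")
    #   ("llm.input_prompts.1", "What is 2+2?")
    # A single string prompt is recorded at index 0: ("llm.input_prompts.0", ...)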

python/instrumentation/openinference-instrumentation-openai/src/openinference/instrumentation/openai/_response_attributes_extractor.py

Lines changed: 12 additions & 0 deletions

@@ -25,6 +25,11 @@
     ToolCallAttributes,
 )
 
+# TODO: Update to use SpanAttributes.LLM_OUTPUT_CHOICES when released in semconv
+_LLM_OUTPUT_CHOICES = "llm.output_choices"
+# TODO: Update to use ChoiceAttributes.CHOICE_TEXT when released in semconv
+_CHOICE_TEXT = "choice.text"
+
 if TYPE_CHECKING:
     from openai.types import Completion, CreateEmbeddingResponse
     from openai.types.chat import ChatCompletion

@@ -114,6 +119,13 @@ def _get_attributes_from_completion(
         if usage := getattr(completion, "usage", None):
             yield from self._get_attributes_from_completion_usage(usage)
 
+        if (choices := getattr(completion, "choices", None)) and isinstance(choices, Iterable):
+            for choice in choices:
+                if (index := getattr(choice, "index", None)) is None:
+                    continue
+                if text := getattr(choice, "text", None):
+                    yield f"{_LLM_OUTPUT_CHOICES}.{index}.{_CHOICE_TEXT}", text
+
     def _get_attributes_from_create_embedding_response(
         self,
         response: "CreateEmbeddingResponse",

python/instrumentation/openinference-instrumentation-openai/tests/openinference/instrumentation/openai/test_instrumentor.py

Lines changed: 7 additions & 4 deletions

@@ -16,7 +16,6 @@
     List,
     Mapping,
     Optional,
-    Sequence,
     Tuple,
     Union,
     cast,

@@ -300,8 +299,8 @@ def test_completions(
     prompt_template_version: str,
     prompt_template_variables: Dict[str, Any],
 ) -> None:
-    # SpanAttributes.LLM_PROMPTS is always a list, so coerce the input accordingly.
-    prompt = prompt_input if isinstance(prompt_input, list) else [prompt_input]
+    # Normalize prompt_input (string or list) to a list for iteration
+    prompts = prompt_input if isinstance(prompt_input, list) else [prompt_input]
     output_texts: List[str] = completion_mock_stream[1] if is_stream else get_texts()
     invocation_parameters = {
         "stream": is_stream,

@@ -399,10 +398,14 @@ async def task() -> None:
     assert isinstance(attributes.pop(INPUT_VALUE, None), str)
     assert isinstance(attributes.pop(INPUT_MIME_TYPE, None), str)
     # Prompts are recorded in request phase, so present regardless of status
-    assert list(cast(Sequence[str], attributes.pop(LLM_PROMPTS, None))) == prompt
+    for i, prompt_text in enumerate(prompts):
+        assert attributes.pop(f"llm.input_prompts.{i}", None) == prompt_text
     if status_code == 200:
         assert isinstance(attributes.pop(OUTPUT_VALUE, None), str)
         assert isinstance(attributes.pop(OUTPUT_MIME_TYPE, None), str)
+        # Check output choices
+        for i, text in enumerate(output_texts):
+            assert attributes.pop(f"llm.output_choices.{i}.choice.text", None) == text
     if not is_stream:
         # Usage is not available for streaming in general.
         assert attributes.pop(LLM_TOKEN_COUNT_TOTAL, None) == completion_usage["total_tokens"]

python/openinference-instrumentation/src/openinference/instrumentation/config.py

Lines changed: 47 additions & 2 deletions

@@ -84,12 +84,22 @@ def __aexit__(
 OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH = "OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH"
 # Limits characters of a base64 encoding of an image
 OPENINFERENCE_HIDE_PROMPTS = "OPENINFERENCE_HIDE_PROMPTS"
-# Hides LLM prompts
+# DEPRECATED: Use OPENINFERENCE_HIDE_INPUT_PROMPTS instead
+OPENINFERENCE_HIDE_INPUT_PROMPTS = "OPENINFERENCE_HIDE_INPUT_PROMPTS"
+# Hides input prompts
+OPENINFERENCE_HIDE_OUTPUT_CHOICES = "OPENINFERENCE_HIDE_OUTPUT_CHOICES"
+# Hides output choices
 REDACTED_VALUE = "__REDACTED__"
 # When a value is hidden, it will be replaced by this redacted value
 
+# TODO: Update to use SpanAttributes constants when released in semconv
+_LLM_INPUT_PROMPTS = "llm.input_prompts"
+_LLM_OUTPUT_CHOICES = "llm.output_choices"
+
 DEFAULT_HIDE_LLM_INVOCATION_PARAMETERS = False
 DEFAULT_HIDE_PROMPTS = False
+DEFAULT_HIDE_INPUT_PROMPTS = False
+DEFAULT_HIDE_OUTPUT_CHOICES = False
 DEFAULT_HIDE_INPUTS = False
 DEFAULT_HIDE_OUTPUTS = False
 

@@ -195,7 +205,23 @@ class TraceConfig:
             "default_value": DEFAULT_HIDE_PROMPTS,
         },
     )
-    """Hides LLM prompts"""
+    """Hides LLM prompts (DEPRECATED: use hide_input_prompts)"""
+    hide_input_prompts: Optional[bool] = field(
+        default=None,
+        metadata={
+            "env_var": OPENINFERENCE_HIDE_INPUT_PROMPTS,
+            "default_value": DEFAULT_HIDE_INPUT_PROMPTS,
+        },
+    )
+    """Hides input prompts"""
+    hide_output_choices: Optional[bool] = field(
+        default=None,
+        metadata={
+            "env_var": OPENINFERENCE_HIDE_OUTPUT_CHOICES,
+            "default_value": DEFAULT_HIDE_OUTPUT_CHOICES,
+        },
+    )
+    """Hides output choices"""
     base64_image_max_length: Optional[int] = field(
         default=None,
         metadata={

@@ -206,6 +232,12 @@ class TraceConfig:
     """Limits characters of a base64 encoding of an image"""
 
     def __post_init__(self) -> None:
+        # Track if hide_input_prompts was explicitly set (not None)
+        # to avoid overriding explicit user configuration
+        hide_input_prompts_was_explicit = self.hide_input_prompts is not None
+        # Also check if it's set via environment variable
+        hide_input_prompts_env_was_set = os.getenv(OPENINFERENCE_HIDE_INPUT_PROMPTS) is not None
+
         for f in fields(self):
             expected_type = get_args(f.type)[0]
             # Optional is Union[T,NoneType]. get_args()returns (T, NoneType).

@@ -216,6 +248,15 @@ def __post_init__(self) -> None:
                 f.metadata["env_var"],
                 f.metadata["default_value"],
             )
+        # TODO: Remove this backward compatibility after deprecation period
+        # Only apply backward compat if hide_input_prompts wasn't explicitly set
+        # via constructor argument or environment variable
+        if (
+            not hide_input_prompts_was_explicit
+            and not hide_input_prompts_env_was_set
+            and self.hide_prompts is True
+        ):
+            object.__setattr__(self, "hide_input_prompts", True)
 
     def mask(
         self,

@@ -226,6 +267,8 @@ def mask(
             return None
         elif self.hide_prompts and key == SpanAttributes.LLM_PROMPTS:
             value = REDACTED_VALUE
+        elif (self.hide_inputs or self.hide_input_prompts) and _LLM_INPUT_PROMPTS in key:
+            value = REDACTED_VALUE
         elif self.hide_inputs and key == SpanAttributes.INPUT_VALUE:
             value = REDACTED_VALUE
         elif self.hide_inputs and key == SpanAttributes.INPUT_MIME_TYPE:

@@ -242,6 +285,8 @@ def mask(
             self.hide_outputs or self.hide_output_messages
         ) and SpanAttributes.LLM_OUTPUT_MESSAGES in key:
             return None
+        elif (self.hide_outputs or self.hide_output_choices) and _LLM_OUTPUT_CHOICES in key:
+            value = REDACTED_VALUE
         elif (
             self.hide_input_text
             and SpanAttributes.LLM_INPUT_MESSAGES in key
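
To illustrate the backward-compatibility rule in __post_init__ (an example, not part of the diff; assumes none of the related environment variables are set):

    from openinference.instrumentation import TraceConfig

    # The deprecated flag alone carries over to the new field.
    config = TraceConfig(hide_prompts=True)
    assert config.hide_input_prompts is True

    # An explicit hide_input_prompts always wins over the deprecated flag.
    config = TraceConfig(hide_prompts=True, hide_input_prompts=False)
    assert config.hide_input_prompts is False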

python/openinference-instrumentation/tests/test_config.py

Lines changed: 20 additions & 0 deletions

@@ -17,18 +17,22 @@
     DEFAULT_BASE64_IMAGE_MAX_LENGTH,
     DEFAULT_HIDE_INPUT_IMAGES,
     DEFAULT_HIDE_INPUT_MESSAGES,
+    DEFAULT_HIDE_INPUT_PROMPTS,
     DEFAULT_HIDE_INPUT_TEXT,
     DEFAULT_HIDE_INPUTS,
     DEFAULT_HIDE_LLM_INVOCATION_PARAMETERS,
+    DEFAULT_HIDE_OUTPUT_CHOICES,
     DEFAULT_HIDE_OUTPUT_MESSAGES,
     DEFAULT_HIDE_OUTPUT_TEXT,
     DEFAULT_HIDE_OUTPUTS,
     DEFAULT_HIDE_PROMPTS,
     OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH,
     OPENINFERENCE_HIDE_INPUT_IMAGES,
     OPENINFERENCE_HIDE_INPUT_MESSAGES,
+    OPENINFERENCE_HIDE_INPUT_PROMPTS,
     OPENINFERENCE_HIDE_INPUT_TEXT,
     OPENINFERENCE_HIDE_INPUTS,
+    OPENINFERENCE_HIDE_OUTPUT_CHOICES,
     OPENINFERENCE_HIDE_OUTPUT_MESSAGES,
     OPENINFERENCE_HIDE_OUTPUT_TEXT,
     OPENINFERENCE_HIDE_OUTPUTS,

@@ -49,6 +53,8 @@ def test_default_settings() -> None:
     assert config.hide_input_text == DEFAULT_HIDE_INPUT_TEXT
     assert config.hide_output_text == DEFAULT_HIDE_OUTPUT_TEXT
     assert config.hide_prompts == DEFAULT_HIDE_PROMPTS
+    assert config.hide_input_prompts == DEFAULT_HIDE_INPUT_PROMPTS
+    assert config.hide_output_choices == DEFAULT_HIDE_OUTPUT_CHOICES
     assert config.base64_image_max_length == DEFAULT_BASE64_IMAGE_MAX_LENGTH

@@ -121,6 +127,8 @@ def test_attribute_priority(k: str, in_memory_span_exporter: InMemorySpanExporter)
 @pytest.mark.parametrize("hide_input_text", [False, True])
 @pytest.mark.parametrize("hide_output_text", [False, True])
 @pytest.mark.parametrize("hide_prompts", [False, True])
+@pytest.mark.parametrize("hide_input_prompts", [False, True])
+@pytest.mark.parametrize("hide_output_choices", [False, True])
 @pytest.mark.parametrize("base64_image_max_length", [10_000])
 def test_settings_from_env_vars_and_code(
     hide_inputs: bool,

@@ -131,6 +139,8 @@ def test_settings_from_env_vars_and_code(
     hide_input_text: bool,
     hide_output_text: bool,
     hide_prompts: bool,
+    hide_input_prompts: bool,
+    hide_output_choices: bool,
     base64_image_max_length: int,
     monkeypatch: pytest.MonkeyPatch,
 ) -> None:

@@ -141,6 +151,8 @@ def test_settings_from_env_vars_and_code(
     monkeypatch.setenv(OPENINFERENCE_HIDE_OUTPUT_MESSAGES, str(hide_output_messages))
     monkeypatch.setenv(OPENINFERENCE_HIDE_INPUT_IMAGES, str(hide_input_images))
     monkeypatch.setenv(OPENINFERENCE_HIDE_PROMPTS, str(hide_prompts))
+    monkeypatch.setenv(OPENINFERENCE_HIDE_INPUT_PROMPTS, str(hide_input_prompts))
+    monkeypatch.setenv(OPENINFERENCE_HIDE_OUTPUT_CHOICES, str(hide_output_choices))
     monkeypatch.setenv(OPENINFERENCE_HIDE_INPUT_TEXT, str(hide_input_text))
     monkeypatch.setenv(OPENINFERENCE_HIDE_OUTPUT_TEXT, str(hide_output_text))
     monkeypatch.setenv(OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH, str(base64_image_max_length))

@@ -154,6 +166,8 @@ def test_settings_from_env_vars_and_code(
     assert config.hide_input_text is parse_bool_from_env(OPENINFERENCE_HIDE_INPUT_TEXT)
     assert config.hide_output_text is parse_bool_from_env(OPENINFERENCE_HIDE_OUTPUT_TEXT)
     assert config.hide_prompts is parse_bool_from_env(OPENINFERENCE_HIDE_PROMPTS)
+    assert config.hide_input_prompts is parse_bool_from_env(OPENINFERENCE_HIDE_INPUT_PROMPTS)
+    assert config.hide_output_choices is parse_bool_from_env(OPENINFERENCE_HIDE_OUTPUT_CHOICES)
     assert config.base64_image_max_length == int(
         os.getenv(OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH, default=-1)
     )

@@ -169,6 +183,8 @@ def test_settings_from_env_vars_and_code(
     new_hide_input_text = not hide_input_text
     new_hide_output_text = not hide_output_text
     new_hide_prompts = not hide_prompts
+    new_hide_input_prompts = not hide_input_prompts
+    new_hide_output_choices = not hide_output_choices
     config = TraceConfig(
         hide_inputs=new_hide_inputs,
         hide_outputs=new_hide_outputs,

@@ -178,6 +194,8 @@ def test_settings_from_env_vars_and_code(
         hide_input_text=new_hide_input_text,
         hide_output_text=new_hide_output_text,
         hide_prompts=new_hide_prompts,
+        hide_input_prompts=new_hide_input_prompts,
+        hide_output_choices=new_hide_output_choices,
         base64_image_max_length=new_base64_image_max_length,
     )
     assert config.hide_inputs is new_hide_inputs

@@ -188,6 +206,8 @@ def test_settings_from_env_vars_and_code(
     assert config.hide_input_text is new_hide_input_text
     assert config.hide_output_text is new_hide_output_text
     assert config.hide_prompts is new_hide_prompts
+    assert config.hide_input_prompts is new_hide_input_prompts
+    assert config.hide_output_choices is new_hide_output_choices
     assert config.base64_image_max_length == new_base64_image_max_length
python/openinference-semantic-conventions/src/openinference/semconv/trace/__init__.py

Lines changed: 23 additions & 0 deletions

@@ -57,6 +57,17 @@ class SpanAttributes:
     LLM_PROMPTS = "llm.prompts"
     """
     Prompts provided to a completions API.
+    DEPRECATED: Use LLM_INPUT_PROMPTS instead for indexed format.
+    """
+    LLM_INPUT_PROMPTS = "llm.input_prompts"
+    """
+    Prompt(s) provided to a completions API. Use indexed format for arrays.
+    Maps to the 'prompt' field in the request (e.g., request.prompt or request.prompt[0]).
+    """
+    LLM_OUTPUT_CHOICES = "llm.output_choices"
+    """
+    Choice(s) returned from a completions API. Use indexed format for arrays.
+    Maps to the 'choices' array in the response (e.g., response.choices[0]).
     """
     LLM_PROMPT_TEMPLATE = "llm.prompt_template.template"
     """

@@ -293,6 +304,18 @@ class MessageAttributes:
     """
 
 
+class ChoiceAttributes:
+    """
+    Attributes for a choice returned from a completions API
+    """
+
+    CHOICE_TEXT = "choice.text"
+    """
+    The text content of a completion choice.
+    Maps to the 'text' field in the choice (e.g., response.choices[0].text).
+    """
+
+
 class MessageContentAttributes:
     """
     Attributes for the contents of user messages sent to an LLM.
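
To illustrate how the new constants compose (an example, not part of the diff; the imports work once this change ships in openinference-semantic-conventions): instrumentations build the flattened keys by joining a namespace constant, an index, and a leaf constant:

    from openinference.semconv.trace import ChoiceAttributes, SpanAttributes

    prompt_key = f"{SpanAttributes.LLM_INPUT_PROMPTS}.0"
    assert prompt_key == "llm.input_prompts.0"
    choice_key = f"{SpanAttributes.LLM_OUTPUT_CHOICES}.0.{ChoiceAttributes.CHOICE_TEXT}"
    assert choice_key == "llm.output_choices.0.choice.text"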

python/openinference-semantic-conventions/tests/openinference/semconv/test_attributes.py

Lines changed: 19 additions & 0 deletions

@@ -54,6 +54,7 @@
 
 from openinference.semconv.resource import ResourceAttributes
 from openinference.semconv.trace import (
+    ChoiceAttributes,
     DocumentAttributes,
     EmbeddingAttributes,
     ImageAttributes,

@@ -117,8 +118,10 @@ def test_nesting(self) -> None:
             },
             "function_call": SpanAttributes.LLM_FUNCTION_CALL,
             "input_messages": SpanAttributes.LLM_INPUT_MESSAGES,
+            "input_prompts": SpanAttributes.LLM_INPUT_PROMPTS,
             "invocation_parameters": SpanAttributes.LLM_INVOCATION_PARAMETERS,
             "model_name": SpanAttributes.LLM_MODEL_NAME,
+            "output_choices": SpanAttributes.LLM_OUTPUT_CHOICES,
             "output_messages": SpanAttributes.LLM_OUTPUT_MESSAGES,
             "prompt_template": {
                 "template": SpanAttributes.LLM_PROMPT_TEMPLATE,

@@ -330,6 +333,22 @@ def test_nesting(self) -> None:
         }
 
 
+class TestChoiceAttributes:
+    """Tests for ChoiceAttributes namespace structure.
+
+    Verifies that completion choice attributes from flat spans are properly
+    organized under the choice namespace.
+    """
+
+    def test_nesting(self) -> None:
+        attributes = _get_attributes(ChoiceAttributes)
+        assert _nested_dict(attributes) == {
+            "choice": {
+                "text": ChoiceAttributes.CHOICE_TEXT,
+            }
+        }
+
+
 class TestResourceAttributes:
     """Tests for ResourceAttributes namespace structure.

spec/configuration.md

Lines changed: 6 additions & 2 deletions

@@ -15,8 +15,10 @@ The possible settings are:
 | OPENINFERENCE_HIDE_OUTPUT_MESSAGES | Hides all output messages (independent of HIDE_OUTPUTS) | bool | False |
 | OPENINFERENCE_HIDE_INPUT_IMAGES | Hides images from input messages (only applies when input messages are not already hidden) | bool | False |
 | OPENINFERENCE_HIDE_INPUT_TEXT | Hides text from input messages (only applies when input messages are not already hidden) | bool | False |
-| OPENINFERENCE_HIDE_PROMPTS | Hides LLM prompts | bool | False |
+| OPENINFERENCE_HIDE_PROMPTS | DEPRECATED: Use OPENINFERENCE_HIDE_INPUT_PROMPTS instead | bool | False |
+| OPENINFERENCE_HIDE_INPUT_PROMPTS | Hides input prompts (for completions API) | bool | False |
 | OPENINFERENCE_HIDE_OUTPUT_TEXT | Hides text from output messages (only applies when output messages are not already hidden) | bool | False |
+| OPENINFERENCE_HIDE_OUTPUT_CHOICES | Hides output choices (for completions API) | bool | False |
 | OPENINFERENCE_HIDE_EMBEDDING_VECTORS | Hides embedding vectors | bool | False |
 | OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH | Limits characters of a base64 encoding of an image | int | 32,000 |

@@ -51,7 +53,9 @@ If you are working in Python, and want to set up a configuration different than
     hide_output_text=...,
     hide_embedding_vectors=...,
     base64_image_max_length=...,
-    hide_prompts=...,
+    hide_prompts=...,  # DEPRECATED: use hide_input_prompts
+    hide_input_prompts=...,
+    hide_output_choices=...,
 )
 
 from openinference.instrumentation.openai import OpenAIInstrumentor
