Commit 62473a2

feat(openai): standardize completions to indexed attribute format
Signed-off-by: Adrian Cole <[email protected]>
1 parent: 4e441f2

11 files changed, +176 −12 lines changed

python/instrumentation/openinference-instrumentation-openai/src/openinference/instrumentation/openai/_attributes/_responses_api.py

Lines changed: 6 additions & 2 deletions
```diff
@@ -482,7 +482,9 @@ def _get_attributes_from_response_input_param_function_call_output(
         if (call_id := obj.get("call_id")) is not None:
             yield f"{prefix}{MessageAttributes.MESSAGE_TOOL_CALL_ID}", call_id
         if (output := obj.get("output")) is not None:
-            yield f"{prefix}{MessageAttributes.MESSAGE_CONTENT}", output
+            # output can be str or complex type - serialize complex types to JSON
+            output_value = output if isinstance(output, str) else safe_json_dumps(output)
+            yield f"{prefix}{MessageAttributes.MESSAGE_CONTENT}", output_value

     @classmethod
     @stop_on_exception
@@ -495,7 +497,9 @@ def _get_attributes_from_response_custom_tool_call_output_param(
         if (call_id := obj.get("call_id")) is not None:
             yield f"{prefix}{MessageAttributes.MESSAGE_TOOL_CALL_ID}", call_id
         if (output := obj.get("output")) is not None:
-            yield f"{prefix}{MessageAttributes.MESSAGE_CONTENT}", output
+            # output can be str or complex type - serialize complex types to JSON
+            output_value = output if isinstance(output, str) else safe_json_dumps(output)
+            yield f"{prefix}{MessageAttributes.MESSAGE_CONTENT}", output_value

     @classmethod
     @stop_on_exception
```
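For reference, the new behavior is easy to sanity-check outside the instrumentor. A minimal sketch, using `json.dumps` as a stand-in for the package's `safe_json_dumps` helper (which adds extra guards for non-serializable values):

```python
import json
from typing import Any


def _serialize_output(output: Any) -> str:
    # Strings pass through unchanged; dicts, lists, and other complex
    # types are flattened to a JSON string for the span attribute.
    if isinstance(output, str):
        return output
    return json.dumps(output, default=str)  # default=str approximates safe_json_dumps


assert _serialize_output("plain text") == "plain text"
assert _serialize_output({"result": [1, 2, 3]}) == '{"result": [1, 2, 3]}'
```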

python/instrumentation/openinference-instrumentation-openai/src/openinference/instrumentation/openai/_request_attributes_extractor.py

Lines changed: 5 additions & 2 deletions
```diff
@@ -32,6 +32,8 @@

 # TODO: Update to use SpanAttributes.EMBEDDING_INVOCATION_PARAMETERS when released in semconv
 _EMBEDDING_INVOCATION_PARAMETERS = "embedding.invocation_parameters"
+# TODO: Update to use SpanAttributes.COMPLETION_PROMPT when released in semconv
+_COMPLETION_PROMPT = "completion.prompt"

 if TYPE_CHECKING:
     from openai.types import Completion, CreateEmbeddingResponse
@@ -226,13 +228,14 @@ def _get_attributes_from_completion_create_param(

     model_prompt = params.get("prompt")
     if isinstance(model_prompt, str):
-        yield SpanAttributes.LLM_PROMPTS, [model_prompt]
+        yield f"{_COMPLETION_PROMPT}.0", model_prompt
     elif (
         isinstance(model_prompt, list)
         and model_prompt
         and all(isinstance(item, str) for item in model_prompt)
     ):
-        yield SpanAttributes.LLM_PROMPTS, model_prompt
+        for index, prompt in enumerate(model_prompt):
+            yield f"{_COMPLETION_PROMPT}.{index}", prompt


 def _get_attributes_from_embedding_create_param(
```
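To make the indexed scheme concrete, here is a hedged sketch of the key/value pairs the extractor now yields for the two accepted prompt shapes (`_indexed_prompts` is illustrative, not a function in the package):

```python
from typing import Iterator, List, Tuple, Union

_COMPLETION_PROMPT = "completion.prompt"


def _indexed_prompts(prompt: Union[str, List[str]]) -> Iterator[Tuple[str, str]]:
    # A single string becomes completion.prompt.0; a list fans out by index.
    prompts = [prompt] if isinstance(prompt, str) else prompt
    for index, text in enumerate(prompts):
        yield f"{_COMPLETION_PROMPT}.{index}", text


assert dict(_indexed_prompts("tell me a joke")) == {"completion.prompt.0": "tell me a joke"}
assert dict(_indexed_prompts(["a", "b"])) == {
    "completion.prompt.0": "a",
    "completion.prompt.1": "b",
}
```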

python/instrumentation/openinference-instrumentation-openai/src/openinference/instrumentation/openai/_response_attributes_extractor.py

Lines changed: 10 additions & 0 deletions
```diff
@@ -25,6 +25,9 @@
     ToolCallAttributes,
 )

+# TODO: Update to use SpanAttributes.COMPLETION_TEXT when released in semconv
+_COMPLETION_TEXT = "completion.text"
+
 if TYPE_CHECKING:
     from openai.types import Completion, CreateEmbeddingResponse
     from openai.types.chat import ChatCompletion
@@ -114,6 +117,13 @@ def _get_attributes_from_completion(
         if usage := getattr(completion, "usage", None):
             yield from self._get_attributes_from_completion_usage(usage)

+        if (choices := getattr(completion, "choices", None)) and isinstance(choices, Iterable):
+            for choice in choices:
+                if (index := getattr(choice, "index", None)) is None:
+                    continue
+                if text := getattr(choice, "text", None):
+                    yield f"{_COMPLETION_TEXT}.{index}", text
+
     def _get_attributes_from_create_embedding_response(
         self,
         response: "CreateEmbeddingResponse",
```

python/instrumentation/openinference-instrumentation-openai/tests/openinference/instrumentation/openai/test_instrumentor.py

Lines changed: 12 additions & 4 deletions
```diff
@@ -16,7 +16,6 @@
     List,
     Mapping,
     Optional,
-    Sequence,
     Tuple,
     Union,
     cast,
@@ -47,6 +46,11 @@
     ToolCallAttributes,
 )

+# TODO: Update to use SpanAttributes.COMPLETION_PROMPT when released in semconv
+_COMPLETION_PROMPT = "completion.prompt"
+# TODO: Update to use SpanAttributes.COMPLETION_TEXT when released in semconv
+_COMPLETION_TEXT = "completion.text"
+
 for name, logger in logging.root.manager.loggerDict.items():
     if name.startswith("openinference.") and isinstance(logger, logging.Logger):
         logger.setLevel(logging.DEBUG)
@@ -300,8 +304,8 @@ def test_completions(
     prompt_template_version: str,
     prompt_template_variables: Dict[str, Any],
 ) -> None:
-    # SpanAttributes.LLM_PROMPTS is always a list, so coerce the input accordingly.
-    prompt = prompt_input if isinstance(prompt_input, list) else [prompt_input]
+    # Normalize prompt_input (string or list) to a list for iteration
+    prompts = prompt_input if isinstance(prompt_input, list) else [prompt_input]
     output_texts: List[str] = completion_mock_stream[1] if is_stream else get_texts()
     invocation_parameters = {
         "stream": is_stream,
@@ -399,10 +403,14 @@ async def task() -> None:
     assert isinstance(attributes.pop(INPUT_VALUE, None), str)
     assert isinstance(attributes.pop(INPUT_MIME_TYPE, None), str)
     # Prompts are recorded in request phase, so present regardless of status
-    assert list(cast(Sequence[str], attributes.pop(LLM_PROMPTS, None))) == prompt
+    for i, prompt_text in enumerate(prompts):
+        assert attributes.pop(f"{_COMPLETION_PROMPT}.{i}", None) == prompt_text
     if status_code == 200:
         assert isinstance(attributes.pop(OUTPUT_VALUE, None), str)
         assert isinstance(attributes.pop(OUTPUT_MIME_TYPE, None), str)
+        # Check output completions
+        for i, text in enumerate(output_texts):
+            assert attributes.pop(f"{_COMPLETION_TEXT}.{i}", None) == text
     if not is_stream:
         # Usage is not available for streaming in general.
         assert attributes.pop(LLM_TOKEN_COUNT_TOTAL, None) == completion_usage["total_tokens"]
```
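Since the indexed attributes are popped one by one, a test helper that drains a whole `prefix.N` family can keep the usual leftover-attribute check intact. A hypothetical sketch (`pop_indexed` is not part of the test suite):

```python
from typing import Any, Dict, List


def pop_indexed(attributes: Dict[str, Any], prefix: str) -> List[Any]:
    # Hypothetical helper: remove prefix.0, prefix.1, ... in order and
    # return their values, so the final "no attributes left" check holds.
    values: List[Any] = []
    while (value := attributes.pop(f"{prefix}.{len(values)}", None)) is not None:
        values.append(value)
    return values


attrs = {"completion.prompt.0": "a", "completion.prompt.1": "b", "other": 1}
assert pop_indexed(attrs, "completion.prompt") == ["a", "b"]
assert attrs == {"other": 1}
```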

python/openinference-instrumentation/src/openinference/instrumentation/config.py

Lines changed: 53 additions & 2 deletions
```diff
@@ -84,12 +84,22 @@ def __aexit__(
 OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH = "OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH"
 # Limits characters of a base64 encoding of an image
 OPENINFERENCE_HIDE_PROMPTS = "OPENINFERENCE_HIDE_PROMPTS"
-# Hides LLM prompts
+# DEPRECATED: Use OPENINFERENCE_HIDE_COMPLETION_PROMPT instead
+OPENINFERENCE_HIDE_COMPLETION_PROMPT = "OPENINFERENCE_HIDE_COMPLETION_PROMPT"
+# Hides completion prompt
+OPENINFERENCE_HIDE_COMPLETION_TEXT = "OPENINFERENCE_HIDE_COMPLETION_TEXT"
+# Hides completion text
 REDACTED_VALUE = "__REDACTED__"
 # When a value is hidden, it will be replaced by this redacted value

+# TODO: Update to use SpanAttributes constants when released in semconv
+_COMPLETION_PROMPT = "completion.prompt"
+_COMPLETION_TEXT = "completion.text"
+
 DEFAULT_HIDE_LLM_INVOCATION_PARAMETERS = False
 DEFAULT_HIDE_PROMPTS = False
+DEFAULT_HIDE_COMPLETION_PROMPT = False
+DEFAULT_HIDE_COMPLETION_TEXT = False
 DEFAULT_HIDE_INPUTS = False
 DEFAULT_HIDE_OUTPUTS = False
@@ -195,7 +205,23 @@ class TraceConfig:
             "default_value": DEFAULT_HIDE_PROMPTS,
         },
     )
-    """Hides LLM prompts"""
+    """Hides LLM prompts (DEPRECATED: use hide_completion_prompt)"""
+    hide_completion_prompt: Optional[bool] = field(
+        default=None,
+        metadata={
+            "env_var": OPENINFERENCE_HIDE_COMPLETION_PROMPT,
+            "default_value": DEFAULT_HIDE_COMPLETION_PROMPT,
+        },
+    )
+    """Hides completion prompt"""
+    hide_completion_text: Optional[bool] = field(
+        default=None,
+        metadata={
+            "env_var": OPENINFERENCE_HIDE_COMPLETION_TEXT,
+            "default_value": DEFAULT_HIDE_COMPLETION_TEXT,
+        },
+    )
+    """Hides completion text"""
     base64_image_max_length: Optional[int] = field(
         default=None,
         metadata={
@@ -206,6 +232,14 @@ class TraceConfig:
     """Limits characters of a base64 encoding of an image"""

     def __post_init__(self) -> None:
+        # Track if hide_completion_prompt was explicitly set (not None)
+        # to avoid overriding explicit user configuration
+        hide_completion_prompt_was_explicit = self.hide_completion_prompt is not None
+        # Also check if it's set via environment variable
+        hide_completion_prompt_env_was_set = (
+            os.getenv(OPENINFERENCE_HIDE_COMPLETION_PROMPT) is not None
+        )
+
         for f in fields(self):
             expected_type = get_args(f.type)[0]
             # Optional is Union[T, NoneType]. get_args() returns (T, NoneType).
@@ -216,6 +250,15 @@ def __post_init__(self) -> None:
                     f.metadata["env_var"],
                     f.metadata["default_value"],
                 )
+        # TODO: Remove this backward compatibility after deprecation period
+        # Only apply backward compat if hide_completion_prompt wasn't explicitly set
+        # via constructor argument or environment variable
+        if (
+            not hide_completion_prompt_was_explicit
+            and not hide_completion_prompt_env_was_set
+            and self.hide_prompts is True
+        ):
+            object.__setattr__(self, "hide_completion_prompt", True)

     def mask(
         self,
@@ -226,6 +269,10 @@ def mask(
             return None
         elif self.hide_prompts and key == SpanAttributes.LLM_PROMPTS:
             value = REDACTED_VALUE
+        elif (
+            self.hide_inputs or self.hide_completion_prompt
+        ) and _COMPLETION_PROMPT in key:
+            value = REDACTED_VALUE
         elif self.hide_inputs and key == SpanAttributes.INPUT_VALUE:
             value = REDACTED_VALUE
         elif self.hide_inputs and key == SpanAttributes.INPUT_MIME_TYPE:
@@ -242,6 +289,10 @@ def mask(
             self.hide_outputs or self.hide_output_messages
         ) and SpanAttributes.LLM_OUTPUT_MESSAGES in key:
             return None
+        elif (
+            self.hide_outputs or self.hide_completion_text
+        ) and _COMPLETION_TEXT in key:
+            value = REDACTED_VALUE
         elif (
             self.hide_input_text
             and SpanAttributes.LLM_INPUT_MESSAGES in key
```
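The `__post_init__` logic above boils down to a precedence order for the new flag. A standalone sketch of that precedence, separate from the library code (`resolve_hide_completion_prompt` is illustrative):

```python
import os
from typing import Optional


def resolve_hide_completion_prompt(
    constructor_value: Optional[bool],
    hide_prompts: bool,
) -> bool:
    # Precedence: explicit constructor arg > env var > deprecated
    # hide_prompts fallback > default (False).
    if constructor_value is not None:
        return constructor_value
    env = os.getenv("OPENINFERENCE_HIDE_COMPLETION_PROMPT")
    if env is not None:
        return env.lower() == "true"
    return hide_prompts


# An explicit value always wins over the deprecated flag:
assert resolve_hide_completion_prompt(False, hide_prompts=True) is False
# With nothing set in the environment, the deprecated flag carries over:
if os.getenv("OPENINFERENCE_HIDE_COMPLETION_PROMPT") is None:
    assert resolve_hide_completion_prompt(None, hide_prompts=True) is True
```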

python/openinference-instrumentation/tests/test_config.py

Lines changed: 20 additions & 0 deletions
```diff
@@ -17,18 +17,22 @@
     DEFAULT_BASE64_IMAGE_MAX_LENGTH,
     DEFAULT_HIDE_INPUT_IMAGES,
     DEFAULT_HIDE_INPUT_MESSAGES,
+    DEFAULT_HIDE_COMPLETION_PROMPT,
     DEFAULT_HIDE_INPUT_TEXT,
     DEFAULT_HIDE_INPUTS,
     DEFAULT_HIDE_LLM_INVOCATION_PARAMETERS,
+    DEFAULT_HIDE_COMPLETION_TEXT,
     DEFAULT_HIDE_OUTPUT_MESSAGES,
     DEFAULT_HIDE_OUTPUT_TEXT,
     DEFAULT_HIDE_OUTPUTS,
     DEFAULT_HIDE_PROMPTS,
     OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH,
     OPENINFERENCE_HIDE_INPUT_IMAGES,
     OPENINFERENCE_HIDE_INPUT_MESSAGES,
+    OPENINFERENCE_HIDE_COMPLETION_PROMPT,
     OPENINFERENCE_HIDE_INPUT_TEXT,
     OPENINFERENCE_HIDE_INPUTS,
+    OPENINFERENCE_HIDE_COMPLETION_TEXT,
     OPENINFERENCE_HIDE_OUTPUT_MESSAGES,
     OPENINFERENCE_HIDE_OUTPUT_TEXT,
     OPENINFERENCE_HIDE_OUTPUTS,
@@ -49,6 +53,8 @@ def test_default_settings() -> None:
     assert config.hide_input_text == DEFAULT_HIDE_INPUT_TEXT
     assert config.hide_output_text == DEFAULT_HIDE_OUTPUT_TEXT
     assert config.hide_prompts == DEFAULT_HIDE_PROMPTS
+    assert config.hide_completion_prompt == DEFAULT_HIDE_COMPLETION_PROMPT
+    assert config.hide_completion_text == DEFAULT_HIDE_COMPLETION_TEXT
     assert config.base64_image_max_length == DEFAULT_BASE64_IMAGE_MAX_LENGTH


@@ -121,6 +127,8 @@ def test_attribute_priority(k: str, in_memory_span_exporter: InMemorySpanExporter)
 @pytest.mark.parametrize("hide_input_text", [False, True])
 @pytest.mark.parametrize("hide_output_text", [False, True])
 @pytest.mark.parametrize("hide_prompts", [False, True])
+@pytest.mark.parametrize("hide_completion_prompt", [False, True])
+@pytest.mark.parametrize("hide_completion_text", [False, True])
 @pytest.mark.parametrize("base64_image_max_length", [10_000])
 def test_settings_from_env_vars_and_code(
     hide_inputs: bool,
@@ -131,6 +139,8 @@ def test_settings_from_env_vars_and_code(
     hide_input_text: bool,
     hide_output_text: bool,
     hide_prompts: bool,
+    hide_completion_prompt: bool,
+    hide_completion_text: bool,
     base64_image_max_length: int,
     monkeypatch: pytest.MonkeyPatch,
 ) -> None:
@@ -141,6 +151,8 @@ def test_settings_from_env_vars_and_code(
     monkeypatch.setenv(OPENINFERENCE_HIDE_OUTPUT_MESSAGES, str(hide_output_messages))
     monkeypatch.setenv(OPENINFERENCE_HIDE_INPUT_IMAGES, str(hide_input_images))
     monkeypatch.setenv(OPENINFERENCE_HIDE_PROMPTS, str(hide_prompts))
+    monkeypatch.setenv(OPENINFERENCE_HIDE_COMPLETION_PROMPT, str(hide_completion_prompt))
+    monkeypatch.setenv(OPENINFERENCE_HIDE_COMPLETION_TEXT, str(hide_completion_text))
     monkeypatch.setenv(OPENINFERENCE_HIDE_INPUT_TEXT, str(hide_input_text))
     monkeypatch.setenv(OPENINFERENCE_HIDE_OUTPUT_TEXT, str(hide_output_text))
     monkeypatch.setenv(OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH, str(base64_image_max_length))
@@ -154,6 +166,8 @@ def test_settings_from_env_vars_and_code(
     assert config.hide_input_text is parse_bool_from_env(OPENINFERENCE_HIDE_INPUT_TEXT)
     assert config.hide_output_text is parse_bool_from_env(OPENINFERENCE_HIDE_OUTPUT_TEXT)
     assert config.hide_prompts is parse_bool_from_env(OPENINFERENCE_HIDE_PROMPTS)
+    assert config.hide_completion_prompt is parse_bool_from_env(OPENINFERENCE_HIDE_COMPLETION_PROMPT)
+    assert config.hide_completion_text is parse_bool_from_env(OPENINFERENCE_HIDE_COMPLETION_TEXT)
     assert config.base64_image_max_length == int(
         os.getenv(OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH, default=-1)
     )
@@ -169,6 +183,8 @@ def test_settings_from_env_vars_and_code(
     new_hide_input_text = not hide_input_text
     new_hide_output_text = not hide_output_text
     new_hide_prompts = not hide_prompts
+    new_hide_completion_prompt = not hide_completion_prompt
+    new_hide_completion_text = not hide_completion_text
     config = TraceConfig(
         hide_inputs=new_hide_inputs,
         hide_outputs=new_hide_outputs,
@@ -178,6 +194,8 @@ def test_settings_from_env_vars_and_code(
         hide_input_text=new_hide_input_text,
         hide_output_text=new_hide_output_text,
         hide_prompts=new_hide_prompts,
+        hide_completion_prompt=new_hide_completion_prompt,
+        hide_completion_text=new_hide_completion_text,
         base64_image_max_length=new_base64_image_max_length,
     )
     assert config.hide_inputs is new_hide_inputs
@@ -188,6 +206,8 @@ def test_settings_from_env_vars_and_code(
     assert config.hide_input_text is new_hide_input_text
     assert config.hide_output_text is new_hide_output_text
     assert config.hide_prompts is new_hide_prompts
+    assert config.hide_completion_prompt is new_hide_completion_prompt
+    assert config.hide_completion_text is new_hide_completion_text
     assert config.base64_image_max_length == new_base64_image_max_length
```

python/openinference-semantic-conventions/src/openinference/semconv/trace/__init__.py

Lines changed: 13 additions & 0 deletions
```diff
@@ -57,6 +57,19 @@ class SpanAttributes:
     LLM_PROMPTS = "llm.prompts"
     """
     Prompts provided to a completions API.
+    DEPRECATED: Use COMPLETION_PROMPT instead for indexed format.
+    """
+    COMPLETION_PROMPT = "completion.prompt"
+    """
+    Prompt(s) provided to a completions API. Use indexed format for arrays.
+    Maps to the 'prompt' field in the request (e.g., request.prompt or request.prompt[0]).
+    Use format: completion.prompt.N
+    """
+    COMPLETION_TEXT = "completion.text"
+    """
+    Text choice(s) returned from a completions API. Use indexed format for arrays.
+    Maps to the 'choices' array in the response (e.g., response.choices[0].text).
+    Use format: completion.text.N
     """
     LLM_PROMPT_TEMPLATE = "llm.prompt_template.template"
     """
```

python/openinference-semantic-conventions/tests/openinference/semconv/test_attributes.py

Lines changed: 4 additions & 0 deletions
```diff
@@ -97,6 +97,10 @@ def test_nesting(self) -> None:
             "mime_type": SpanAttributes.INPUT_MIME_TYPE,
             "value": SpanAttributes.INPUT_VALUE,
         },
+        "completion": {
+            "prompt": SpanAttributes.COMPLETION_PROMPT,
+            "text": SpanAttributes.COMPLETION_TEXT,
+        },
         "llm": {
             "cost": {
                 "completion": SpanAttributes.LLM_COST_COMPLETION,
```

spec/configuration.md

Lines changed: 6 additions & 2 deletions
```diff
@@ -15,8 +15,10 @@ The possible settings are:
 | OPENINFERENCE_HIDE_OUTPUT_MESSAGES | Hides all output messages (independent of HIDE_OUTPUTS) | bool | False |
 | OPENINFERENCE_HIDE_INPUT_IMAGES | Hides images from input messages (only applies when input messages are not already hidden) | bool | False |
 | OPENINFERENCE_HIDE_INPUT_TEXT | Hides text from input messages (only applies when input messages are not already hidden) | bool | False |
-| OPENINFERENCE_HIDE_PROMPTS | Hides LLM prompts | bool | False |
+| OPENINFERENCE_HIDE_PROMPTS | DEPRECATED: Use OPENINFERENCE_HIDE_COMPLETION_PROMPT instead | bool | False |
+| OPENINFERENCE_HIDE_COMPLETION_PROMPT | Hides completion prompt (for completions API) | bool | False |
 | OPENINFERENCE_HIDE_OUTPUT_TEXT | Hides text from output messages (only applies when output messages are not already hidden) | bool | False |
+| OPENINFERENCE_HIDE_COMPLETION_TEXT | Hides completion text (for completions API) | bool | False |
 | OPENINFERENCE_HIDE_EMBEDDING_VECTORS | Hides embedding vectors | bool | False |
 | OPENINFERENCE_BASE64_IMAGE_MAX_LENGTH | Limits characters of a base64 encoding of an image | int | 32,000 |

@@ -51,7 +53,9 @@ If you are working in Python, and want to set up a configuration different than
     hide_output_text=...,
     hide_embedding_vectors=...,
     base64_image_max_length=...,
-    hide_prompts=...,
+    hide_prompts=...,  # DEPRECATED: use hide_completion_prompt
+    hide_completion_prompt=...,
+    hide_completion_text=...,
 )

 from openinference.instrumentation.openai import OpenAIInstrumentor
```
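The same settings can also come from the environment instead of code. A short sketch, assuming the `openinference-instrumentation-openai` package is installed and the variables are set before the instrumentor builds its `TraceConfig`:

```python
import os

# Hide both the completion prompt and the completion text on emitted spans.
os.environ["OPENINFERENCE_HIDE_COMPLETION_PROMPT"] = "true"
os.environ["OPENINFERENCE_HIDE_COMPLETION_TEXT"] = "true"

from openinference.instrumentation.openai import OpenAIInstrumentor

OpenAIInstrumentor().instrument()
```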
