Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(bedrock): support metrics for bedrock #1957

Merged
merged 12 commits into from
Oct 2, 2024

Large diffs are not rendered by default.

41 changes: 10 additions & 31 deletions packages/opentelemetry-instrumentation-bedrock/tests/conftest.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,41 +3,10 @@
import os
import pytest
import boto3
from opentelemetry import trace
from opentelemetry.instrumentation.bedrock import BedrockInstrumentor
from opentelemetry.sdk.trace import TracerProvider
from opentelemetry.sdk.trace.export import SimpleSpanProcessor
from opentelemetry.sdk.trace.export.in_memory_span_exporter import InMemorySpanExporter

pytest_plugins = []


@pytest.fixture(scope="session")
def exporter():
    """Session-wide in-memory span exporter wired into the global tracer provider."""
    span_exporter = InMemorySpanExporter()

    tracer_provider = TracerProvider()
    tracer_provider.add_span_processor(SimpleSpanProcessor(span_exporter))
    trace.set_tracer_provider(tracer_provider)

    return span_exporter


@pytest.fixture(scope="session", autouse=True)
def instrument(exporter):
    """Instrument Bedrock once for the whole session; release the exporter afterwards."""
    BedrockInstrumentor(enrich_token_usage=True).instrument()
    try:
        yield
    finally:
        exporter.shutdown()


@pytest.fixture(autouse=True)
def clear_exporter(exporter):
    """Drop spans captured by earlier tests so each test asserts only on its own."""
    exporter.clear()


@pytest.fixture(autouse=True)
def environment():
if os.getenv("AWS_SECRET_ACCESS_KEY") is None:
Expand All @@ -55,6 +24,16 @@ def brt():
)


@pytest.fixture
def brt2():
    """Bedrock runtime client for the metrics tests, built from env credentials."""
    credentials = {
        "aws_access_key_id": os.getenv("AWS_ACCESS_KEY_ID"),
        "aws_secret_access_key": os.getenv("AWS_SECRET_ACCESS_KEY"),
    }
    return boto3.client(
        service_name="bedrock-runtime",
        region_name="us-west-2",
        **credentials,
    )


@pytest.fixture(scope="module")
def vcr_config():
    """Keep AWS credentials out of recorded cassettes."""
    filtered = ["authorization"]
    return {"filter_headers": filtered}
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
"""unit tests."""
Original file line number Diff line number Diff line change
@@ -0,0 +1,54 @@
interactions:
- request:
body: '{"inputText": "Tell me a joke about opentelemetry", "textGenerationConfig":
{"maxTokenCount": 200, "temperature": 0.5, "topP": 0.5}}'
headers:
Accept:
- !!binary |
YXBwbGljYXRpb24vanNvbg==
Content-Length:
- '132'
Content-Type:
- !!binary |
YXBwbGljYXRpb24vanNvbg==
User-Agent:
- !!binary |
Qm90bzMvMS4zNC4xNjIgbWQvQm90b2NvcmUjMS4zNC4xNjIgdWEvMi4wIG9zL21hY29zIzIzLjYu
MCBtZC9hcmNoI2FybTY0IGxhbmcvcHl0aG9uIzMuMTEuNSBtZC9weWltcGwjQ1B5dGhvbiBjZmcv
cmV0cnktbW9kZSNsZWdhY3kgQm90b2NvcmUvMS4zNC4xNjI=
X-Amz-Date:
- !!binary |
MjAyNDA5MTlUMDgxNTMyWg==
amz-sdk-invocation-id:
- !!binary |
YmNjNTcxNjYtYjRmOC00MzQzLTg4YmYtNWE4YzBhODBmZTM5
amz-sdk-request:
- !!binary |
YXR0ZW1wdD0x
method: POST
uri: https://bedrock-runtime.us-west-2.amazonaws.com/model/amazon.titan-text-express-v1/invoke
response:
body:
string: '{"inputTextTokenCount":9,"results":[{"tokenCount":17,"outputText":"\nWhat
do you call a bear with no teeth?\nA gummy bear.","completionReason":"FINISH"}]}'
headers:
Connection:
- keep-alive
Content-Length:
- '154'
Content-Type:
- application/json
Date:
- Thu, 19 Sep 2024 08:15:34 GMT
X-Amzn-Bedrock-Input-Token-Count:
- '9'
X-Amzn-Bedrock-Invocation-Latency:
- '1229'
X-Amzn-Bedrock-Output-Token-Count:
- '17'
x-amzn-RequestId:
- 6278b8bf-c1a7-46d7-822b-9f85ee7805b6
status:
code: 200
message: OK
version: 1
Original file line number Diff line number Diff line change
@@ -0,0 +1,42 @@
"""Unit tests configuration module."""

import pytest
from opentelemetry import metrics
from opentelemetry.sdk.resources import Resource
from opentelemetry.sdk.metrics import MeterProvider
from opentelemetry.sdk.metrics.export import InMemoryMetricReader
from opentelemetry.instrumentation.bedrock import BedrockInstrumentor

from opentelemetry import trace
from opentelemetry.sdk.trace import TracerProvider
from opentelemetry.sdk.trace.export import SimpleSpanProcessor
from opentelemetry.sdk.trace.export.in_memory_span_exporter import InMemorySpanExporter


@pytest.fixture(scope="session")
def metrics_test_context():
    """Install global meter/tracer providers and instrument Bedrock.

    Returns the (MeterProvider, InMemoryMetricReader) pair so tests can pull
    the metrics collected during a call.
    """
    reader = InMemoryMetricReader()
    meter_provider = MeterProvider(
        metric_readers=[reader],
        resource=Resource.create(),
    )
    metrics.set_meter_provider(meter_provider)

    # A recording tracer provider is required: with the default no-op provider
    # span.is_recording() is False, so _handle_call and _handle_stream_call
    # would be skipped and no metrics would be emitted.
    tracer_provider = TracerProvider()
    tracer_provider.add_span_processor(SimpleSpanProcessor(InMemorySpanExporter()))
    trace.set_tracer_provider(tracer_provider)

    BedrockInstrumentor(enrich_token_usage=True).instrument()

    return meter_provider, reader


@pytest.fixture(scope="session", autouse=True)
def clear_metrics_test_context(metrics_test_context):
    """Shut down the metric reader and provider at session teardown.

    The ``yield`` is essential: without it the fixture body runs at session
    *setup*, shutting the reader/provider down before any test executes.
    """
    provider, reader = metrics_test_context

    yield

    reader.shutdown()
    provider.shutdown()
Original file line number Diff line number Diff line change
@@ -0,0 +1,68 @@
import json

import pytest
from opentelemetry.semconv_ai import Meters, SpanAttributes


@pytest.mark.vcr
def test_invoke_model_metrics(metrics_test_context, brt2):
    """Invoke amazon.titan-text-express-v1 (via VCR cassette) and verify the
    Bedrock instrumentation records token-usage and operation-duration metrics."""
    if brt2 is None:
        # Skip visibly in the pytest report instead of silently passing
        # via print-and-return.
        pytest.skip("bedrock-runtime client is unavailable")

    _, reader = metrics_test_context

    body = json.dumps(
        {
            "inputText": "Tell me a joke about opentelemetry",
            "textGenerationConfig": {
                "maxTokenCount": 200,
                "temperature": 0.5,
                "topP": 0.5,
            },
        }
    )

    brt2.invoke_model(
        body=body,
        modelId="amazon.titan-text-express-v1",
        accept="application/json",
        contentType="application/json",
    )

    metrics_data = reader.get_metrics_data()
    resource_metrics = metrics_data.resource_metrics
    assert len(resource_metrics) > 0

    found_token_metric = False
    found_duration_metric = False

    for rm in resource_metrics:
        for sm in rm.scope_metrics:
            for metric in sm.metrics:
                if metric.name == Meters.LLM_TOKEN_USAGE:
                    found_token_metric = True
                    for data_point in metric.data.data_points:
                        assert data_point.attributes[
                            SpanAttributes.LLM_TOKEN_TYPE
                        ] in ["output", "input"]
                        assert data_point.sum > 0

                if metric.name == Meters.LLM_OPERATION_DURATION:
                    found_duration_metric = True
                    assert any(
                        data_point.count > 0
                        for data_point in metric.data.data_points
                    )
                    assert any(
                        data_point.sum > 0
                        for data_point in metric.data.data_points
                    )

                # Every emitted metric must be attributed to the bedrock system.
                assert (
                    metric.data.data_points[0].attributes[SpanAttributes.LLM_SYSTEM]
                    == "bedrock"
                )

    assert found_token_metric is True
    assert found_duration_metric is True
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
"""unit tests."""
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
"""Unit tests configuration module."""

import pytest
from opentelemetry import trace
from opentelemetry.instrumentation.bedrock import BedrockInstrumentor
from opentelemetry.sdk.trace import TracerProvider
from opentelemetry.sdk.trace.export import SimpleSpanProcessor
from opentelemetry.sdk.trace.export.in_memory_span_exporter import InMemorySpanExporter


@pytest.fixture(scope="session")
def exporter():
    """Create a session-scoped in-memory exporter and make it the global tracer sink."""
    in_memory_exporter = InMemorySpanExporter()
    provider = TracerProvider()
    provider.add_span_processor(SimpleSpanProcessor(in_memory_exporter))
    trace.set_tracer_provider(provider)
    return in_memory_exporter


@pytest.fixture(scope="session", autouse=True)
def instrument(exporter):
    """Enable Bedrock instrumentation for the session, then shut the exporter down."""
    instrumentor = BedrockInstrumentor(enrich_token_usage=True)
    instrumentor.instrument()

    yield

    exporter.shutdown()


@pytest.fixture(autouse=True)
def clear_exporter(exporter):
    """Start every test with an empty span buffer."""
    exporter.clear()
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
import json


@pytest.mark.vcr()
@pytest.mark.vcr
def test_ai21_j2_completion_string_content(exporter, brt):
body = json.dumps(
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
import json


@pytest.mark.vcr()
@pytest.mark.vcr
def test_meta_llama2_completion_string_content(exporter, brt):
model_id = "meta.llama2-13b-chat-v1"
prompt = """<s>[INST] <<SYS>>
Expand Down Expand Up @@ -44,7 +44,7 @@ def test_meta_llama2_completion_string_content(exporter, brt):
)


@pytest.mark.vcr()
@pytest.mark.vcr
def test_meta_llama3_completion(exporter, brt):
model_id = "meta.llama3-70b-instruct-v1:0"
prompt = "Tell me a joke about opentelemetry"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
import json


@pytest.mark.vcr()
@pytest.mark.vcr
def test_titan_completion(exporter, brt):
body = json.dumps(
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,8 @@ class Meters:
LLM_WATSONX_COMPLETIONS_RESPONSES = "llm.watsonx.completions.responses"
LLM_WATSONX_COMPLETIONS_TOKENS = "llm.watsonx.completions.tokens"

LLM_BEDROCK_COMPLETIONS_EXCEPTIONS = "llm.bedrock.completions.exceptions"
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Is this required?

Copy link
Contributor Author

@jinsongo jinsongo Sep 20, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It's an open issue. I think it's better to use a common name, for example llm.completions.exceptions, for all AI systems to count exceptions. If so, I would like to use another PR to fix all the related code.

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@jinsongo if we're doing this here I'd try to use the new genAI conventions - https://opentelemetry.io/docs/specs/semconv/gen-ai/gen-ai-metrics
I think they're already released so you can even use them directly from the original otel semconv package

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

(in this case - it means exceptions are counted in the duration metric)

Copy link
Contributor Author

@jinsongo jinsongo Sep 21, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@nirga I cannot find an appropriate metric name for the exceptions counter of Bedrock. As you know, version 0.4.1 of opentelemetry-semantic-conventions-ai does not include LLM_BEDROCK_COMPLETIONS_EXCEPTIONS although it's already included in this current PR's commits, which causes the build to fail when I use it in the Bedrock instrumentation code. Actually, that's the same approach used for OpenAI, Anthropic, and Watsonx.

Copy link
Member

@nirga nirga Sep 21, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@jinsongo this should be in the standard opentelemetry-semantic-conventions package. And you should count exceptions on the duration metric as specified in the spec.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@jinsongo If this parameter is not required, I think we can ignore it for now, and we can fix it in the future as a consolidation of the semantic conventions.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@gyliu513 I have removed LLM_BEDROCK_COMPLETIONS_EXCEPTIONS from semconv_ai, and added a TODO comment about fixing in future as a consolidation for semantic convention.



class SpanAttributes:
# Semantic Conventions for LLM requests, this needs to be removed after
Expand Down
Loading