
Commit 1ea6e32

Judgment Release Bot committed
[Bump Minor Version] Release: Merge staging to main
2 parents f2261c1 + 20495c5

File tree

12 files changed (+314, -134 lines)


src/e2etests/test_tracer.py

Lines changed: 3 additions & 3 deletions
@@ -286,7 +286,7 @@ def retrieve_llm_cost_helper(trace_id):
         span_attrs = span.get("span_attributes", {})
         if isinstance(span_attrs, str):
             span_attrs = orjson.loads(span_attrs)
-        llm_cost = span_attrs.get("gen_ai.usage.total_cost_usd", 0)
+        llm_cost = span_attrs.get("judgment.usage.total_cost_usd", 0)
         total_llm_cost += llm_cost

     if total_llm_cost == 0:
@@ -325,8 +325,8 @@ def retrieve_streaming_trace_helper(trace_id):
         assert False, "No completion content found in streaming span"

     # Should have usage information
-    input_tokens = span_attributes.get("gen_ai.usage.input_tokens")
-    output_tokens = span_attributes.get("gen_ai.usage.output_tokens")
+    input_tokens = span_attributes.get("judgment.usage.non_cached_input_tokens")
+    output_tokens = span_attributes.get("judgment.usage.output_tokens")

     if input_tokens is None or output_tokens is None:
         assert False, "Missing usage tokens in streaming span"

src/judgeval/tracer/keys.py

Lines changed: 10 additions & 9 deletions
@@ -26,18 +26,19 @@ class AttributeKeys(str, Enum):

     PENDING_TRACE_EVAL = "judgment.pending_trace_eval"

+    JUDGMENT_LLM_PROVIDER = "judgment.llm.provider"
+    JUDGMENT_LLM_MODEL_NAME = "judgment.llm.model"
+    JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS = "judgment.usage.non_cached_input_tokens"
+    JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS = (
+        "judgment.usage.cache_creation_input_tokens"
+    )
+    JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS = "judgment.usage.cache_read_input_tokens"
+    JUDGMENT_USAGE_OUTPUT_TOKENS = "judgment.usage.output_tokens"
+    JUDGMENT_USAGE_TOTAL_COST_USD = "judgment.usage.total_cost_usd"
+
     GEN_AI_PROMPT = "gen_ai.prompt"
     GEN_AI_COMPLETION = "gen_ai.completion"
-    GEN_AI_REQUEST_MODEL = "gen_ai.request.model"
-    GEN_AI_RESPONSE_MODEL = "gen_ai.response.model"
     GEN_AI_SYSTEM = "gen_ai.system"
-    GEN_AI_USAGE_INPUT_TOKENS = "gen_ai.usage.input_tokens"
-    GEN_AI_USAGE_OUTPUT_TOKENS = "gen_ai.usage.output_tokens"
-    GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS = (
-        "gen_ai.usage.cache_creation_input_tokens"
-    )
-    GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS = "gen_ai.usage.cache_read_input_tokens"
-
     GEN_AI_REQUEST_TEMPERATURE = "gen_ai.request.temperature"
     GEN_AI_REQUEST_MAX_TOKENS = "gen_ai.request.max_tokens"
     GEN_AI_RESPONSE_FINISH_REASONS = "gen_ai.response.finish_reasons"
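
The renamed enum folds request and response model into a single judgment.llm.model key and splits input tokens into non-cached, cache-read, and cache-creation buckets. A minimal sketch of recombining those buckets, assuming the total input count is simply their sum (how they recombine is an assumption here, not something this commit states):

from judgeval.tracer.keys import AttributeKeys

def total_input_tokens(attrs: dict) -> int:
    # AttributeKeys is a str Enum, so its members hash like their string
    # values and work as keys into a plain attribute dict.
    return sum(
        int(attrs.get(key, 0))
        for key in (
            AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
            AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS,
            AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
        )
    )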

src/judgeval/tracer/llm/llm_anthropic/messages.py

Lines changed: 34 additions & 22 deletions
@@ -95,7 +95,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:
        )
        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )

    def post_hook(ctx: Dict[str, Any], result: Message) -> None:
@@ -112,17 +112,19 @@ def post_hook(ctx: Dict[str, Any], result: Message) -> None:
                _extract_anthropic_tokens(result.usage)
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens
+                span,
+                AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
+                prompt_tokens,
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens
+                span, AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS, completion_tokens
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
+                span, AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
            )
            set_span_attribute(
                span,
-                AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                cache_creation,
            )
            set_span_attribute(
@@ -133,7 +135,7 @@ def post_hook(ctx: Dict[str, Any], result: Message) -> None:

        set_span_attribute(
            span,
-            AttributeKeys.GEN_AI_RESPONSE_MODEL,
+            AttributeKeys.JUDGMENT_LLM_MODEL_NAME,
            result.model,
        )

@@ -169,7 +171,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:
        )
        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )
        ctx["accumulated_content"] = ""

@@ -197,17 +199,21 @@ def yield_hook(inner_ctx: Dict[str, Any], chunk: RawMessageStreamEvent) -> None:
                _extract_anthropic_tokens(usage_data)
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens
+                span,
+                AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
+                prompt_tokens,
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens
+                span, AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS, completion_tokens
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
+                span,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS,
+                cache_read,
            )
            set_span_attribute(
                span,
-                AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                cache_creation,
            )
            set_span_attribute(
@@ -279,7 +285,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:
        )
        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )

    def post_hook(ctx: Dict[str, Any], result: Message) -> None:
@@ -296,17 +302,19 @@ def post_hook(ctx: Dict[str, Any], result: Message) -> None:
                _extract_anthropic_tokens(result.usage)
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens
+                span,
+                AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
+                prompt_tokens,
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens
+                span, AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS, completion_tokens
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
+                span, AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
            )
            set_span_attribute(
                span,
-                AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                cache_creation,
            )
            set_span_attribute(
@@ -317,7 +325,7 @@ def post_hook(ctx: Dict[str, Any], result: Message) -> None:

        set_span_attribute(
            span,
-            AttributeKeys.GEN_AI_RESPONSE_MODEL,
+            AttributeKeys.JUDGMENT_LLM_MODEL_NAME,
            result.model,
        )

@@ -354,7 +362,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:
        )
        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )
        ctx["accumulated_content"] = ""

@@ -382,17 +390,21 @@ def yield_hook(inner_ctx: Dict[str, Any], chunk: RawMessageStreamEvent) -> None:
                _extract_anthropic_tokens(usage_data)
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens
+                span,
+                AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
+                prompt_tokens,
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens
+                span, AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS, completion_tokens
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
+                span,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS,
+                cache_read,
            )
            set_span_attribute(
                span,
-                AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                cache_creation,
            )
            set_span_attribute(
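
All four hook sites in this file unpack a four-tuple from _extract_anthropic_tokens, whose body is not part of this diff. A plausible sketch of that helper, assuming it reads the anthropic SDK's Usage fields (the real implementation may differ):

def _extract_anthropic_tokens(usage):
    # Assumed mapping: anthropic's Usage exposes input_tokens (non-cached),
    # output_tokens, cache_read_input_tokens, and cache_creation_input_tokens.
    prompt_tokens = getattr(usage, "input_tokens", 0) or 0
    completion_tokens = getattr(usage, "output_tokens", 0) or 0
    cache_read = getattr(usage, "cache_read_input_tokens", 0) or 0
    cache_creation = getattr(usage, "cache_creation_input_tokens", 0) or 0
    return prompt_tokens, completion_tokens, cache_read, cache_creation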

src/judgeval/tracer/llm/llm_anthropic/messages_stream.py

Lines changed: 12 additions & 12 deletions
@@ -44,7 +44,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:

        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )
        ctx["accumulated_content"] = ""

@@ -125,22 +125,22 @@ def post_hook_exit_impl() -> None:
                ) = _extract_anthropic_tokens(final_message.usage)
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
                    prompt_tokens,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS,
                    completion_tokens,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS,
                    cache_read,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                    cache_creation,
                )
                set_span_attribute(
@@ -151,7 +151,7 @@ def post_hook_exit_impl() -> None:

                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_RESPONSE_MODEL,
+                    AttributeKeys.JUDGMENT_LLM_MODEL_NAME,
                    final_message.model,
                )
            except Exception:
@@ -190,7 +190,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:

        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )
        ctx["accumulated_content"] = ""

@@ -271,22 +271,22 @@ async def post_hook_aexit_impl() -> None:
                ) = _extract_anthropic_tokens(final_message.usage)
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
                    prompt_tokens,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS,
                    completion_tokens,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS,
                    cache_read,
                )
                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                    AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                    cache_creation,
                )
                set_span_attribute(
@@ -297,7 +297,7 @@ async def post_hook_aexit_impl() -> None:

                set_span_attribute(
                    span,
-                    AttributeKeys.GEN_AI_RESPONSE_MODEL,
+                    AttributeKeys.JUDGMENT_LLM_MODEL_NAME,
                    final_message.model,
                )
            except Exception:
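
The streaming hooks call set_span_attribute unconditionally, even before usage data exists on the final message. A minimal sketch of the guard that pattern implies, assuming the helper skips unset values (its actual definition lives elsewhere in the tracer):

from typing import Any, Optional
from opentelemetry.trace import Span

def set_span_attribute(span: Optional[Span], key: str, value: Any) -> None:
    # Assumed guard: drop None spans and None values so hooks can call
    # this unconditionally before token counts are known.
    if span is not None and value is not None:
        span.set_attribute(key, value)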

src/judgeval/tracer/llm/llm_google/generate_content.py

Lines changed: 8 additions & 6 deletions
@@ -63,7 +63,7 @@ def pre_hook(ctx: Dict[str, Any], *args: Any, **kwargs: Any) -> None:
        )
        ctx["model_name"] = kwargs.get("model", "")
        set_span_attribute(
-            ctx["span"], AttributeKeys.GEN_AI_REQUEST_MODEL, ctx["model_name"]
+            ctx["span"], AttributeKeys.JUDGMENT_LLM_MODEL_NAME, ctx["model_name"]
        )

    def post_hook(ctx: Dict[str, Any], result: GenerateContentResponse) -> None:
@@ -79,17 +79,19 @@ def post_hook(ctx: Dict[str, Any], result: GenerateContentResponse) -> None:
                _extract_google_tokens(usage_data)
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_INPUT_TOKENS, prompt_tokens
+                span,
+                AttributeKeys.JUDGMENT_USAGE_NON_CACHED_INPUT_TOKENS,
+                prompt_tokens,
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_OUTPUT_TOKENS, completion_tokens
+                span, AttributeKeys.JUDGMENT_USAGE_OUTPUT_TOKENS, completion_tokens
            )
            set_span_attribute(
-                span, AttributeKeys.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
+                span, AttributeKeys.JUDGMENT_USAGE_CACHE_READ_INPUT_TOKENS, cache_read
            )
            set_span_attribute(
                span,
-                AttributeKeys.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
+                AttributeKeys.JUDGMENT_USAGE_CACHE_CREATION_INPUT_TOKENS,
                cache_creation,
            )
            set_span_attribute(
@@ -100,7 +102,7 @@ def post_hook(ctx: Dict[str, Any], result: GenerateContentResponse) -> None:

        set_span_attribute(
            span,
-            AttributeKeys.GEN_AI_RESPONSE_MODEL,
+            AttributeKeys.JUDGMENT_LLM_MODEL_NAME,
            result.model_version if result.model_version else ctx["model_name"],
        )
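
As with the Anthropic helper, _extract_google_tokens is not shown in this diff. A sketch of a mapping consistent with the renamed buckets, assuming google-genai's usage_metadata field names and assuming prompt_token_count includes cached tokens (both assumptions, not statements from this commit):

def _extract_google_tokens(usage_metadata):
    # Assumed field names from google-genai's usage metadata; Gemini reports
    # no cache-creation count, so that bucket is zero here.
    prompt = usage_metadata.prompt_token_count or 0
    cached = usage_metadata.cached_content_token_count or 0
    completion = usage_metadata.candidates_token_count or 0
    non_cached_input = max(prompt - cached, 0)
    return non_cached_input, completion, cached, 0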
