chore: Add supportability metrics for LLM vendors and models. (#3006)

jaffinito · web-flow · commit a41309182914 · 2025-03-03T08:53:11.000-06:00
diff --git a/src/Agent/NewRelic/Agent/Extensions/NewRelic.Agent.Extensions/Llm/SupportabilityHelpers.cs b/src/Agent/NewRelic/Agent/Extensions/NewRelic.Agent.Extensions/Llm/SupportabilityHelpers.cs
@@ -0,0 +1,105 @@
+// Copyright 2020 New Relic, Inc. All rights reserved.
+// SPDX-License-Identifier: Apache-2.0
+
+using System;
+using System.Collections.Concurrent;
+using System.Text.RegularExpressions;
+using NewRelic.Agent.Api;
+
+namespace NewRelic.Agent.Extensions.Llm
+{
+    /// <summary>
+    /// Reports which LLM vendors and model families an application uses by passing
+    /// "DotNet/LLM/{vendor}/{model}" names to <c>IAgent.RecordSupportabilityMetric</c>.
+    /// Every (source, model id) pair is reported at most once for the lifetime of this static class.
+    /// </summary>
+    public static class SupportabilityHelpers
+    {
+        private const string OpenAiDateRemovalPattern = @"-\d{4}-\d{2}-\d{2}";
+
+        // Keys are "{source}:{model id}". The source prefix keeps an id already reported through one
+        // helper from suppressing the metric of the other helper. Values are unused.
+        private static readonly ConcurrentDictionary<string, object> _seenModels = new();
+
+        /// <summary>
+        /// Records "DotNet/LLM/openai/{model}" the first time <paramref name="model"/> is seen.
+        /// A trailing "-yyyy-MM-dd" date is stripped and at most the first two '-' separated
+        /// segments are kept, e.g. "gpt-4o-2024-11-20" becomes "gpt-4o" and "o1" stays "o1".
+        /// </summary>
+        /// <param name="model">The OpenAI model id. Null, empty or whitespace ids are ignored.</param>
+        /// <param name="agent">The agent used to record the metric and to log failures.</param>
+        public static void CreateModelIdSupportabilityMetricsForOpenAi(string model, IAgent agent)
+        {
+            // Only want to send this metric once-ish per model
+            if (!IsFirstSighting("openai", model))
+            {
+                return;
+            }
+
+            try
+            {
+                // Example openai: o1
+                // Example openai: gpt-4o-2024-11-20
+                var noDateModel = Regex.Replace(model, OpenAiDateRemovalPattern, string.Empty);
+                var modelIdDetails = noDateModel.Split('-');
+                if (modelIdDetails[0].Length == 0)
+                {
+                    // Nothing usable is left (e.g. the id was only a date suffix); do not emit "DotNet/LLM/openai/".
+                    return;
+                }
+
+                agent.RecordSupportabilityMetric("DotNet/LLM/openai/" + BuildModelName(modelIdDetails, true));
+            }
+            catch (Exception ex) // if there is a problem, this will also only happen once-ish per model
+            {
+                agent.Logger.Finest($"Error creating model supportability metric for {model}: {ex.Message}");
+            }
+        }
+
+        /// <summary>
+        /// Records "DotNet/LLM/{vendor}/{model}" the first time <paramref name="model"/> is seen.
+        /// Handles "vendor.model", "region.vendor.model" and hyphen-only marketplace ids
+        /// ("vendor-model-..."); ids with any other number of '.' separated sections are ignored.
+        /// For "nova", "titan" and "claude" the first two '-' separated segments of the model are
+        /// kept, for every other family only the first.
+        /// </summary>
+        /// <param name="model">The Bedrock model id. Null, empty or whitespace ids are ignored.</param>
+        /// <param name="agent">The agent used to record the metric and to log failures.</param>
+        public static void CreateModelIdSupportabilityMetricsForBedrock(string model, IAgent agent)
+        {
+            // Only want to send this metric once-ish per model
+            if (!IsFirstSighting("bedrock", model))
+            {
+                return;
+            }
+
+            try
+            {
+                // Example foundation bedrock: anthropic.claude-3-5-sonnet-20241022-v2:0
+                // Example inference bedrock: us.anthropic.claude-3-5-sonnet-20241022-v2:0
+                // Example bedrock marketplace: deepseek-llm-r1
+                var modelDetails = model.Split('.');
+                if (modelDetails.Length == 1) // bedrock marketplace
+                {
+                    var marketplaceDetails = modelDetails[0].Split('-');
+                    if (marketplaceDetails.Length < 2)
+                    {
+                        // No separator at all, so there is no vendor/model pair to report.
+                        return;
+                    }
+
+                    // Format the bedrock marketplace model id into one that can be used by the standard logic.
+                    modelDetails =
+                    [
+                        marketplaceDetails[0],
+                        string.Join("-", marketplaceDetails, 1, marketplaceDetails.Length - 1)
+                    ];
+                }
+
+                if (modelDetails.Length != 2 && modelDetails.Length != 3)
+                {
+                    return;
+                }
+
+                // if there is a region, it will be the first part of the model id
+                var vendorIndex = modelDetails.Length == 2 ? 0 : 1;
+                var vendor = modelDetails[vendorIndex];
+
+                // Drop the ":n" suffix, then break the model name into its '-' separated segments.
+                var modelIdDetails = modelDetails[vendorIndex + 1].Split(':')[0].Split('-');
+                if (vendor.Length == 0 || modelIdDetails[0].Length == 0)
+                {
+                    // Ids such as "anthropic." or ".claude-3" would otherwise yield a metric with an empty part.
+                    return;
+                }
+
+                // first 2 - capture some extra details to narrow down support
+                // first only - any model that doesn't need the above extra details
+                var needsSecondSegment = modelIdDetails[0] is "nova" or "titan" or "claude";
+                agent.RecordSupportabilityMetric("DotNet/LLM/" + vendor + "/" + BuildModelName(modelIdDetails, needsSecondSegment));
+            }
+            catch (Exception ex) // if there is a problem, this will also only happen once-ish per model
+            {
+                agent.Logger.Finest($"Error creating model supportability metric for {model}: {ex.Message}");
+            }
+        }
+
+        // True only for the first call with a usable model id for the given source; the id is remembered either way.
+        private static bool IsFirstSighting(string source, string model)
+        {
+            return !string.IsNullOrWhiteSpace(model) && _seenModels.TryAdd(source + ":" + model, null);
+        }
+
+        // Joins the first two segments with '-' when requested and available, otherwise returns the first segment alone.
+        private static string BuildModelName(string[] modelIdDetails, bool includeSecondSegment)
+        {
+            if (includeSecondSegment && modelIdDetails.Length > 1 && modelIdDetails[1].Length > 0)
+            {
+                return modelIdDetails[0] + "-" + modelIdDetails[1];
+            }
+
+            return modelIdDetails[0];
+        }
+    }
+}
diff --git a/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/Bedrock/ConverseAsyncWrapper.cs b/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/Bedrock/ConverseAsyncWrapper.cs
@@ -42,7 +42,7 @@ public AfterWrappedMethodDelegate BeforeWrappedMethod(InstrumentedMethodCall ins
 
         dynamic converseRequest = instrumentedMethodCall.MethodCall.MethodArguments[0];
         string modelId = converseRequest.ModelId.ToLower();
-
+        SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock(modelId, agent);
         var operationType = "completion"; // Converse doesn't support embedding
         var segment = transaction.StartCustomSegment(instrumentedMethodCall.MethodCall, $"Llm/{operationType}/{VendorName}/{instrumentedMethodCall.MethodCall.Method.MethodName}");
 
diff --git a/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/Bedrock/InvokeModelAsyncWrapper.cs b/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/Bedrock/InvokeModelAsyncWrapper.cs
@@ -45,6 +45,7 @@ public AfterWrappedMethodDelegate BeforeWrappedMethod(InstrumentedMethodCall ins
             }
 
             dynamic invokeModelRequest = instrumentedMethodCall.MethodCall.MethodArguments[0];
+            SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock((string)invokeModelRequest.ModelId, agent);
             var operationType = invokeModelRequest.ModelId.Contains("embed") ? "embedding" : "completion";
             var segment = transaction.StartCustomSegment(
                 instrumentedMethodCall.MethodCall,
diff --git a/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/OpenAI/OpenAIChatWrapper.cs b/src/Agent/NewRelic/Agent/Extensions/Providers/Wrapper/OpenAI/OpenAIChatWrapper.cs
@@ -97,6 +97,7 @@ public AfterWrappedMethodDelegate BeforeWrappedMethod(InstrumentedMethodCall ins
         agent.RecordSupportabilityMetric($"DotNet/ML/{GetVendorName()}/{version}");
 
         string model = _modelFieldAccessor(instrumentedMethodCall.MethodCall.InvocationTarget);
+        SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(model, agent); // prepend vendor name to model id
 
         if (isAsync)
         {
diff --git a/tests/Agent/IntegrationTests/IntegrationTests/LLM/BedrockConverseTests.cs b/tests/Agent/IntegrationTests/IntegrationTests/LLM/BedrockConverseTests.cs
@@ -102,7 +102,8 @@ public void ConverseTest()
             var expectedMetrics = new List<Assertions.ExpectedMetric>
             {
                 new() { metricName = @"Custom/Llm/completion/Bedrock/ConverseAsync", CallCountAllHarvests = 2 },
-                new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true}
+                new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true},
+                new() { metricName = @"Supportability/DotNet/LLM/.*/.*", IsRegexName = true} // Supportability/DotNet/LLM/{vendor}/{model}
             };
 
             var customEventsSuccess = _fixture.AgentLog.GetCustomEvents().Where(ce => !ce.Attributes.Keys.Contains("error")).ToList();
diff --git a/tests/Agent/IntegrationTests/IntegrationTests/LLM/BedrockInvokeTests.cs b/tests/Agent/IntegrationTests/IntegrationTests/LLM/BedrockInvokeTests.cs
@@ -111,7 +111,8 @@ public void BedrockTest()
             {
                 new Assertions.ExpectedMetric { metricName = @"Custom/Llm/completion/Bedrock/InvokeModelAsync", CallCountAllHarvests = _bedrockModelsToTest.Count - 1 },
                 new Assertions.ExpectedMetric { metricName = @"Custom/Llm/embedding/Bedrock/InvokeModelAsync", CallCountAllHarvests = 1 },
-                new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true}
+                new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true},
+                new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/LLM/.*/.*", IsRegexName = true} // Supportability/DotNet/LLM/{vendor}/{model}
             };
 
             var customEvents = _fixture.AgentLog.GetCustomEvents().ToList();
diff --git a/tests/Agent/IntegrationTests/IntegrationTests/LLM/OpenAITests.cs b/tests/Agent/IntegrationTests/IntegrationTests/LLM/OpenAITests.cs
@@ -117,7 +117,8 @@ public void OpenAITest()
                 new() { metricName = @"Custom/Llm/completion/openai/CompleteChatAsync", metricScope = "OtherTransaction/Custom/MultiFunctionApplicationHelpers.NetStandardLibraries.LLM.OpenAIExerciser/CompleteChatAsync"},
                 new() { metricName = @"Custom/Llm/completion/openai/CompleteChat" },
                 new() { metricName = @"Custom/Llm/completion/openai/CompleteChat", metricScope = "OtherTransaction/Custom/MultiFunctionApplicationHelpers.NetStandardLibraries.LLM.OpenAIExerciser/CompleteChat"},
-                new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true}
+                new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true},
+                new() { metricName = @"Supportability/DotNet/LLM/.*/.*", IsRegexName = true} // Supportability/DotNet/LLM/{vendor}/{model}
             };
 
             var customEventsSuccess = _fixture.AgentLog.GetCustomEvents().Where(ce => !ce.Attributes.Keys.Contains("error")).ToList();
diff --git a/tests/Agent/UnitTests/NewRelic.Agent.Extensions.Tests/Llm/SupportabilityHelpersTests.cs b/tests/Agent/UnitTests/NewRelic.Agent.Extensions.Tests/Llm/SupportabilityHelpersTests.cs
@@ -0,0 +1,169 @@
+// Copyright 2020 New Relic, Inc. All rights reserved.
+// SPDX-License-Identifier: Apache-2.0
+
+using System;
+using System.Collections.Generic;
+using NewRelic.Agent.Api;
+using NewRelic.Agent.Extensions.Llm;
+using NUnit.Framework;
+using Telerik.JustMock;
+
+namespace Agent.Extensions.Tests.Llm
+{
+    // The helpers under test remember every model id they are given and only report a metric the first time,
+    // so each test case must use a model id that no other test case uses.
+    [TestFixture]
+    public class SupportabilityHelpersTests
+    {
+        private IAgent _agent;
+
+        [SetUp]
+        public void Setup() => _agent = Mock.Create<IAgent>();
+
+        // Routes every RecordSupportabilityMetric call on the mock agent into the returned list,
+        // prefixed the way the metric is expected to appear: Supportability/DotNet/LLM/{vendor}/{model}
+        private List<string> CaptureRecordedMetrics()
+        {
+            var recorded = new List<string>();
+            Mock.Arrange(() => _agent.RecordSupportabilityMetric(Arg.AnyString, Arg.AnyLong))
+                .DoInstead((string name, long count) => recorded.Add($"Supportability/{name}"));
+            return recorded;
+        }
+
+        // The most recently recorded metric, or an empty string when nothing was recorded.
+        private static string LastOrEmpty(List<string> recorded)
+        {
+            return recorded.Count == 0 ? string.Empty : recorded[recorded.Count - 1];
+        }
+
+        [TestCase("anthropic.claude-3-sonnet-20240229-v1:0", "anthropic", "claude-3")]
+        [TestCase("us.anthropic.claude-3-sonnet-20240229-v1:0", "anthropic", "claude-3")]
+        [TestCase("apac.anthropic.claude-3-sonnet-20240229-v1:0", "anthropic", "claude-3")]
+        [TestCase("meta.llama3-2-3b-instruct-v1:0", "meta", "llama3")]
+        [TestCase("us.meta.llama3-2-3b-instruct-v1:0", "meta", "llama3")]
+        [TestCase("amazon.nova-lite-v1:0", "amazon", "nova-lite")]
+        [TestCase("eu.amazon.nova-lite-v1:0", "amazon", "nova-lite")]
+        [TestCase("amazon.titan-embed-text-v1", "amazon", "titan-embed")]
+        [TestCase("us.amazon.titan-embed-text-v1", "amazon", "titan-embed")]
+        [TestCase("ai21.jamba-1-5-large-v1:0", "ai21", "jamba")]
+        [TestCase("apac.ai21.jamba-1-5-large-v1:0", "ai21", "jamba")]
+        [TestCase("writer-palmyra-med-70b-32k", "writer", "palmyra")]
+        public void Bedrock_ModelFormatsTests(string fullModel, string vendor, string model)
+        {
+            var expectedMetric = $"Supportability/DotNet/LLM/{vendor}/{model}";
+            var recorded = CaptureRecordedMetrics();
+
+            SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock(fullModel, _agent);
+
+            var actualMetric = LastOrEmpty(recorded);
+            Assert.That(actualMetric, Is.EqualTo(expectedMetric), $"Model: '{fullModel}', Actual: '{actualMetric}', Expected: '{expectedMetric}'");
+        }
+
+        [TestCase("o1", "openai", "o1")]
+        [TestCase("o3-mini", "openai", "o3-mini")]
+        [TestCase("gpt-4o-2024-11-20", "openai", "gpt-4o")]
+        public void OpenAi_ModelFormatsTests(string fullModel, string vendor, string model)
+        {
+            var expectedMetric = $"Supportability/DotNet/LLM/{vendor}/{model}";
+            var recorded = CaptureRecordedMetrics();
+
+            SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(fullModel, _agent);
+
+            var actualMetric = LastOrEmpty(recorded);
+            Assert.That(actualMetric, Is.EqualTo(expectedMetric), $"Model: '{fullModel}', Actual: '{actualMetric}', Expected: '{expectedMetric}'");
+        }
+
+        [TestCase("bedrock", "")]
+        [TestCase("bedrock", "bedrock.bad.model.more.than.four.sections")]
+        [TestCase("openai", "")]
+        public void BadModel_NoMetricTest(string source, string model)
+        {
+            // The capture callback is arranged but is not expected to run for these inputs.
+            var recorded = CaptureRecordedMetrics();
+
+            // Model is always stored so we want to check different values
+            switch (source)
+            {
+                case "bedrock":
+                    SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock(model, _agent);
+                    break;
+                case "openai":
+                    SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(model, _agent);
+                    break;
+            }
+
+            Assert.That(recorded, Is.Empty);
+        }
+
+        [Test]
+        public void Bedrock_DuplicateModels_OnlyOneMetricTest()
+        {
+            var fullModel = "luma.ray-v2:0";
+            var expectedMetric = $"Supportability/DotNet/LLM/luma/ray";
+            var recorded = CaptureRecordedMetrics();
+
+            // Four identical calls; only the first may produce a metric.
+            for (var attempt = 0; attempt < 4; attempt++)
+            {
+                SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock(fullModel, _agent);
+            }
+
+            Assert.That(recorded, Has.Count.EqualTo(1));
+            Assert.That(recorded[0], Is.EqualTo(expectedMetric), $"Model: '{fullModel}', Actual: '{recorded[0]}', Expected: '{expectedMetric}'");
+        }
+
+        [Test]
+        public void OpenAi_DuplicateModels_OnlyOneMetricTest()
+        {
+            var fullModel = "gpt-4.5";
+            var expectedMetric = $"Supportability/DotNet/LLM/openai/gpt-4.5";
+            var recorded = CaptureRecordedMetrics();
+
+            // Four identical calls; only the first may produce a metric.
+            for (var attempt = 0; attempt < 4; attempt++)
+            {
+                SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(fullModel, _agent);
+            }
+
+            Assert.That(recorded, Has.Count.EqualTo(1));
+            Assert.That(recorded[0], Is.EqualTo(expectedMetric), $"Model: '{fullModel}', Actual: '{recorded[0]}', Expected: '{expectedMetric}'");
+        }
+
+        [Test]
+        public void Bedrock_Exception_Test()
+        {
+            var fullModel = "meta.llama3-1-70b-instruct-v1:0";
+            var failure = new Exception("Test exception");
+            var expectedLogLine = $"Error creating model supportability metric for {fullModel}: {failure.Message}";
+
+            // Recording the metric fails, so the helper is expected to log instead of throwing.
+            Mock.Arrange(() => _agent.RecordSupportabilityMetric(Arg.AnyString, Arg.AnyLong))
+                .Throws(failure);
+
+            var loggedLine = string.Empty;
+            Mock.Arrange(() => _agent.Logger.Finest(Arg.AnyString))
+                .DoInstead((string line) => loggedLine = line);
+
+            SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock(fullModel, _agent);
+
+            Assert.That(loggedLine, Is.EqualTo(expectedLogLine), loggedLine);
+        }
+
+        [Test]
+        public void OpenAi_Exception_Test()
+        {
+            var fullModel = "chatgpt-4o";
+            var failure = new Exception("Test exception");
+            var expectedLogLine = $"Error creating model supportability metric for {fullModel}: {failure.Message}";
+
+            // Recording the metric fails, so the helper is expected to log instead of throwing.
+            Mock.Arrange(() => _agent.RecordSupportabilityMetric(Arg.AnyString, Arg.AnyLong))
+                .Throws(failure);
+
+            var loggedLine = string.Empty;
+            Mock.Arrange(() => _agent.Logger.Finest(Arg.AnyString))
+                .DoInstead((string line) => loggedLine = line);
+
+            SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(fullModel, _agent);
+
+            Assert.That(loggedLine, Is.EqualTo(expectedLogLine), loggedLine);
+        }
+    }
+}

Original file line number	Diff line number	Diff line change
`@@ -45,6 +45,7 @@ public AfterWrappedMethodDelegate BeforeWrappedMethod(InstrumentedMethodCall ins`
`45`	`45`	`}`
`46`	`46`
`47`	`47`	`dynamic invokeModelRequest = instrumentedMethodCall.MethodCall.MethodArguments[0];`
	`48`	`+ SupportabilityHelpers.CreateModelIdSupportabilityMetricsForBedrock((string)invokeModelRequest.ModelId, agent);`
`48`	`49`	`var operationType = invokeModelRequest.ModelId.Contains("embed") ? "embedding" : "completion";`
`49`	`50`	`var segment = transaction.StartCustomSegment(`
`50`	`51`	`instrumentedMethodCall.MethodCall,`
Original file line number	Diff line number	Diff line change
`@@ -97,6 +97,7 @@ public AfterWrappedMethodDelegate BeforeWrappedMethod(InstrumentedMethodCall ins`
`97`	`97`	`agent.RecordSupportabilityMetric($"DotNet/ML/{GetVendorName()}/{version}");`
`98`	`98`
`99`	`99`	`string model = _modelFieldAccessor(instrumentedMethodCall.MethodCall.InvocationTarget);`
	`100`	`+ SupportabilityHelpers.CreateModelIdSupportabilityMetricsForOpenAi(model, agent); // prepend vendor name to model id`
`100`	`101`
`101`	`102`	`if (isAsync)`
`102`	`103`	`{`
Original file line number	Diff line number	Diff line change
`@@ -102,7 +102,8 @@ public void ConverseTest()`
`102`	`102`	`var expectedMetrics = new List<Assertions.ExpectedMetric>`
`103`	`103`	`{`
`104`	`104`	`new() { metricName = @"Custom/Llm/completion/Bedrock/ConverseAsync", CallCountAllHarvests = 2 },`
`105`		`- new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true}`
	`105`	`+ new() { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true},`
	`106`	`+ new() { metricName = @"Supportability/DotNet/LLM/.*/.*", IsRegexName = true} // Supportability/DotNet/LLM/{vendor}/{model}`
`106`	`107`	`};`
`107`	`108`
`108`	`109`	`var customEventsSuccess = _fixture.AgentLog.GetCustomEvents().Where(ce => !ce.Attributes.Keys.Contains("error")).ToList();`
Original file line number	Diff line number	Diff line change
`@@ -111,7 +111,8 @@ public void BedrockTest()`
`111`	`111`	`{`
`112`	`112`	`new Assertions.ExpectedMetric { metricName = @"Custom/Llm/completion/Bedrock/InvokeModelAsync", CallCountAllHarvests = _bedrockModelsToTest.Count - 1 },`
`113`	`113`	`new Assertions.ExpectedMetric { metricName = @"Custom/Llm/embedding/Bedrock/InvokeModelAsync", CallCountAllHarvests = 1 },`
`114`		`- new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true}`
	`114`	`+ new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/ML/.*", IsRegexName = true},`
	`115`	`+ new Assertions.ExpectedMetric { metricName = @"Supportability/DotNet/LLM/.*/.*", IsRegexName = true} // Supportability/DotNet/LLM/{vendor}/{model}`
`115`	`116`	`};`
`116`	`117`
`117`	`118`	`var customEvents = _fixture.AgentLog.GetCustomEvents().ToList();`