dotnet
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/EquivalenceEvaluatorContext.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/EquivalenceEvaluatorContext.cs
Lines changed: 6 additions & 0 deletions
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/GroundednessEvaluatorContext.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/GroundednessEvaluatorContext.cs
Lines changed: 6 additions & 0 deletions
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/RelevanceTruthAndCompletenessEvaluator.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Quality/RelevanceTruthAndCompletenessEvaluator.cs
Lines changed: 12 additions & 12 deletions
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Reporting/CSharp/ReportingConfiguration.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Reporting/CSharp/ReportingConfiguration.cs
Lines changed: 1 addition & 1 deletion
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Reporting/TypeScript/components/ChatDetailsSection.tsx b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Reporting/TypeScript/components/ChatDetailsSection.tsx
Lines changed: 1 addition & 1 deletion
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Safety/CodeVulnerabilityEvaluator.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Safety/CodeVulnerabilityEvaluator.cs
Lines changed: 7 additions & 28 deletions
diff --git a/src/Libraries/Microsoft.Extensions.AI.Evaluation.Safety/ContentHarmEvaluator.cs b/src/Libraries/Microsoft.Extensions.AI.Evaluation.Safety/ContentHarmEvaluator.cs
Lines changed: 15 additions & 39 deletions
@@ -6,6 +6,8 @@
 // We disable this warning because it is a false positive arising from the analyzer's lack of support for C#'s primary
 // constructor syntax.
 
+using System.Collections.Generic;
+
 namespace Microsoft.Extensions.AI.Evaluation.Quality;
 
 /// <summary>
@@ -29,4 +31,8 @@ public sealed class EquivalenceEvaluatorContext(string groundTruth) : Evaluation
     /// the response supplied via <see cref="GroundTruth"/>.
     /// </remarks>
     public string GroundTruth { get; } = groundTruth;
+
+    /// <inheritdoc/>
+    public override IReadOnlyList<AIContent> GetContents()
+        => [new TextContent(GroundTruth)];
 }
@@ -6,6 +6,8 @@
 // We disable this warning because it is a false positive arising from the analyzer's lack of support for C#'s primary
 // constructor syntax.
 
+using System.Collections.Generic;
+
 namespace Microsoft.Extensions.AI.Evaluation.Quality;
 
 /// <summary>
@@ -29,4 +31,8 @@ public sealed class GroundednessEvaluatorContext(string groundingContext) : Eval
     /// in the information present in the supplied <see cref="GroundingContext"/>.
     /// </remarks>
     public string GroundingContext { get; } = groundingContext;
+
+    /// <inheritdoc/>
+    public override IReadOnlyList<AIContent> GetContents()
+        => [new TextContent(GroundingContext)];
 }
@@ -171,9 +171,9 @@ await JsonOutputFixer.RepairJsonAsync(
                             result.AddDiagnosticToAllMetrics(
                                 EvaluationDiagnostic.Error(
                                     $"""
-                                Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:
-                                {evaluationResponseText}
-                                """));
+                                    Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:
+                                    {evaluationResponseText}
+                                    """));
                         }
                         else
                         {
@@ -186,10 +186,10 @@ await JsonOutputFixer.RepairJsonAsync(
                         result.AddDiagnosticToAllMetrics(
                             EvaluationDiagnostic.Error(
                                 $"""
-                            Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:
-                            {evaluationResponseText}
-                            {ex}
-                            """));
+                                Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:
+                                {evaluationResponseText}
+                                {ex}
+                                """));
                     }
                 }
             }
@@ -211,28 +211,28 @@ void UpdateResult()
 
             if (!string.IsNullOrWhiteSpace(evaluationResponse.ModelId))
             {
-                commonMetadata["rtc-evaluation-model-used"] = evaluationResponse.ModelId!;
+                commonMetadata["evaluation-model-used"] = evaluationResponse.ModelId!;
             }
 
             if (evaluationResponse.Usage is UsageDetails usage)
             {
                 if (usage.InputTokenCount is not null)
                 {
-                    commonMetadata["rtc-evaluation-input-tokens-used"] = $"{usage.InputTokenCount}";
+                    commonMetadata["evaluation-input-tokens-used"] = $"{usage.InputTokenCount}";
                 }
 
                 if (usage.OutputTokenCount is not null)
                 {
-                    commonMetadata["rtc-evaluation-output-tokens-used"] = $"{usage.OutputTokenCount}";
+                    commonMetadata["evaluation-output-tokens-used"] = $"{usage.OutputTokenCount}";
                 }
 
                 if (usage.TotalTokenCount is not null)
                 {
-                    commonMetadata["rtc-evaluation-total-tokens-used"] = $"{usage.TotalTokenCount}";
+                    commonMetadata["evaluation-total-tokens-used"] = $"{usage.TotalTokenCount}";
                 }
             }
 
-            commonMetadata["rtc-evaluation-duration"] = duration;
+            commonMetadata["evaluation-duration"] = duration;
 
             NumericMetric relevance = result.Get<NumericMetric>(RelevanceMetricName);
             relevance.Value = rating.Relevance;
 
@@ -263,7 +263,7 @@ await ResponseCacheProvider.GetCacheAsync(
 
     private static IEnumerable<string> GetCachingKeysForChatClient(IChatClient chatClient)
     {
-        var metadata = chatClient.GetService<ChatClientMetadata>();
+        ChatClientMetadata? metadata = chatClient.GetService<ChatClientMetadata>();
 
         string? providerName = metadata?.ProviderName;
         if (!string.IsNullOrWhiteSpace(providerName))
 
@@ -24,7 +24,7 @@ export const ChatDetailsSection = ({ chatDetails }: { chatDetails: ChatDetails;
         <div className={classes.section}>
             <div className={classes.sectionHeader} onClick={() => setIsExpanded(!isExpanded)}>
                 {isExpanded ? <ChevronDown12Regular /> : <ChevronRight12Regular />}
-                <h3 className={classes.sectionHeaderText}>LLM Chat Diagnostic Details</h3>
+                <h3 className={classes.sectionHeaderText}>Diagnostic Data</h3>
                 {hasCacheStatus && (
                     <div className={classes.hint}>
                         {cachedTurns != totalTurns ?
 
@@ -2,9 +2,9 @@
 // The .NET Foundation licenses this file to you under the MIT license.
 
 using System.Collections.Generic;
-using System.Linq;
 using System.Threading;
 using System.Threading.Tasks;
+using Microsoft.Shared.Diagnostics;
 
 namespace Microsoft.Extensions.AI.Evaluation.Safety;
 
@@ -31,26 +31,17 @@ namespace Microsoft.Extensions.AI.Evaluation.Safety;
 /// will be ignored.
 /// </para>
 /// </remarks>
-/// <param name="contentSafetyServiceConfiguration">
-/// Specifies the Azure AI project that should be used and credentials that should be used when this
-/// <see cref="ContentSafetyEvaluator"/> communicates with the Azure AI Content Safety service to perform
-/// evaluations.
-/// </param>
-public sealed class CodeVulnerabilityEvaluator(ContentSafetyServiceConfiguration contentSafetyServiceConfiguration)
+public sealed class CodeVulnerabilityEvaluator()
     : ContentSafetyEvaluator(
-        contentSafetyServiceConfiguration,
         contentSafetyServiceAnnotationTask: "code vulnerability",
-        evaluatorName: nameof(CodeVulnerabilityEvaluator))
+        metricNames: new Dictionary<string, string> { ["code_vulnerability"] = CodeVulnerabilityMetricName })
 {
     /// <summary>
     /// Gets the <see cref="EvaluationMetric.Name"/> of the <see cref="BooleanMetric"/> returned by
     /// <see cref="CodeVulnerabilityEvaluator"/>.
     /// </summary>
     public static string CodeVulnerabilityMetricName => "Code Vulnerability";
 
-    /// <inheritdoc/>
-    public override IReadOnlyCollection<string> EvaluationMetricNames => [CodeVulnerabilityMetricName];
-
     /// <inheritdoc/>
     public override async ValueTask<EvaluationResult> EvaluateAsync(
         IEnumerable<ChatMessage> messages,
@@ -59,30 +50,18 @@ public override async ValueTask<EvaluationResult> EvaluateAsync(
         IEnumerable<EvaluationContext>? additionalContext = null,
         CancellationToken cancellationToken = default)
     {
-        const string CodeVulnerabilityContentSafetyServiceMetricName = "code_vulnerability";
+        _ = Throw.IfNull(chatConfiguration);
+        _ = Throw.IfNull(modelResponse);
 
         EvaluationResult result =
             await EvaluateContentSafetyAsync(
+                chatConfiguration.ChatClient,
                 messages,
                 modelResponse,
+                additionalContext,
                 contentSafetyServicePayloadFormat: ContentSafetyServicePayloadFormat.ContextCompletion.ToString(),
-                contentSafetyServiceMetricName: CodeVulnerabilityContentSafetyServiceMetricName,
                 cancellationToken: cancellationToken).ConfigureAwait(false);
 
-        IEnumerable<EvaluationMetric> updatedMetrics =
-            result.Metrics.Values.Select(
-                metric =>
-                {
-                    if (metric.Name == CodeVulnerabilityContentSafetyServiceMetricName)
-                    {
-                        metric.Name = CodeVulnerabilityMetricName;
-                    }
-
-                    return metric;
-                });
-
-        result = new EvaluationResult(updatedMetrics);
-        result.Interpret(metric => metric is BooleanMetric booleanMetric ? booleanMetric.InterpretScore() : null);
         return result;
     }
 }
@@ -2,44 +2,27 @@
 // The .NET Foundation licenses this file to you under the MIT license.
 
 using System.Collections.Generic;
-using System.Linq;
 using System.Threading;
 using System.Threading.Tasks;
+using Microsoft.Shared.Diagnostics;
 
 namespace Microsoft.Extensions.AI.Evaluation.Safety;
 
-#pragma warning disable S1694 // An abstract class should have both abstract and concrete methods
 /// <summary>
 /// An <see langword="abstract"/> base class that can be used to implement <see cref="IEvaluator"/>s that utilize the
 /// Azure AI Content Safety service to evaluate responses produced by an AI model for the presence of a variety of
 /// harmful content such as violence, hate speech, etc.
 /// </summary>
-/// <param name="contentSafetyServiceConfiguration">
-/// Specifies the Azure AI project that should be used and credentials that should be used when this
-/// <see cref="ContentSafetyEvaluator"/> communicates with the Azure AI Content Safety service to perform evaluations.
-/// </param>
-/// <param name="contentSafetyServiceMetricName">
-/// The name of the metric that should be used when this <see cref="ContentSafetyEvaluator"/> communicates with the
-/// Azure AI Content Safety service to perform evaluations.
+/// <param name="metricNames">
+/// A dictionary containing the mapping from the names of the metrics that are used when communicating with the Azure
+/// AI Content Safety service to the <see cref="EvaluationMetric.Name"/>s of the <see cref="EvaluationMetric"/>s
+/// returned by this <see cref="IEvaluator"/>.
 /// </param>
-/// <param name="metricName">
-/// The name of the <see cref="EvaluationMetric"/> produced by this <see cref="ContentSafetyEvaluator"/>.
-/// </param>
-/// <param name="evaluatorName">The name of the derived <see cref="ContentSafetyEvaluator"/>.</param>
-public abstract class ContentHarmEvaluator(
-    ContentSafetyServiceConfiguration contentSafetyServiceConfiguration,
-    string contentSafetyServiceMetricName,
-    string metricName,
-    string evaluatorName)
-        : ContentSafetyEvaluator(
-            contentSafetyServiceConfiguration,
-            contentSafetyServiceAnnotationTask: "content harm",
-            evaluatorName)
+#pragma warning disable S1694 // An abstract class should have both abstract and concrete methods
+public abstract class ContentHarmEvaluator(IDictionary<string, string> metricNames)
+    : ContentSafetyEvaluator(contentSafetyServiceAnnotationTask: "content harm", metricNames)
 #pragma warning restore S1694
 {
-    /// <inheritdoc/>
-    public override IReadOnlyCollection<string> EvaluationMetricNames => [metricName];
-
     /// <inheritdoc/>
     public sealed override async ValueTask<EvaluationResult> EvaluateAsync(
         IEnumerable<ChatMessage> messages,
@@ -48,28 +31,21 @@ public sealed override async ValueTask<EvaluationResult> EvaluateAsync(
         IEnumerable<EvaluationContext>? additionalContext = null,
         CancellationToken cancellationToken = default)
     {
+        _ = Throw.IfNull(chatConfiguration);
+        _ = Throw.IfNull(modelResponse);
+
         EvaluationResult result =
             await EvaluateContentSafetyAsync(
+                chatConfiguration.ChatClient,
                 messages,
                 modelResponse,
+                additionalContext,
                 contentSafetyServicePayloadFormat: ContentSafetyServicePayloadFormat.Conversation.ToString(),
-                contentSafetyServiceMetricName: contentSafetyServiceMetricName,
                 cancellationToken: cancellationToken).ConfigureAwait(false);
 
-        IEnumerable<EvaluationMetric> updatedMetrics =
-            result.Metrics.Values.Select(
-                metric =>
-                {
-                    if (metric.Name == contentSafetyServiceMetricName)
-                    {
-                        metric.Name = metricName;
-                    }
-
-                    return metric;
-                });
+        result.Interpret(
+            metric => metric is NumericMetric numericMetric ? numericMetric.InterpretContentHarmScore() : null);
 
-        result = new EvaluationResult(updatedMetrics);
-        result.Interpret(metric => metric is NumericMetric numericMetric ? numericMetric.InterpretHarmScore() : null);
         return result;
     }
 }
Original file line number	Diff line number	Diff line change
`@@ -171,9 +171,9 @@ await JsonOutputFixer.RepairJsonAsync(`
`171`	`171`	`result.AddDiagnosticToAllMetrics(`
`172`	`172`	`EvaluationDiagnostic.Error(`
`173`	`173`	`$"""`
`174`		`- Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:`
`175`		`- {evaluationResponseText}`
`176`		`- """));`
	`174`	`+ Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:`
	`175`	`+ {evaluationResponseText}`
	`176`	`+ """));`
`177`	`177`	`}`
`178`	`178`	`else`
`179`	`179`	`{`
`@@ -186,10 +186,10 @@ await JsonOutputFixer.RepairJsonAsync(`
`186`	`186`	`result.AddDiagnosticToAllMetrics(`
`187`	`187`	`EvaluationDiagnostic.Error(`
`188`	`188`	`$"""`
`189`		`- Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:`
`190`		`- {evaluationResponseText}`
`191`		`- {ex}`
`192`		`- """));`
	`189`	`+ Failed to repair the following response from the model and parse scores for '{RelevanceMetricName}', '{TruthMetricName}' and '{CompletenessMetricName}'.:`
	`190`	`+ {evaluationResponseText}`
	`191`	`+ {ex}`
	`192`	`+ """));`
`193`	`193`	`}`
`194`	`194`	`}`
`195`	`195`	`}`
`@@ -211,28 +211,28 @@ void UpdateResult()`
`211`	`211`
`212`	`212`	`if (!string.IsNullOrWhiteSpace(evaluationResponse.ModelId))`
`213`	`213`	`{`
`214`		`- commonMetadata["rtc-evaluation-model-used"] = evaluationResponse.ModelId!;`
	`214`	`+ commonMetadata["evaluation-model-used"] = evaluationResponse.ModelId!;`
`215`	`215`	`}`
`216`	`216`
`217`	`217`	`if (evaluationResponse.Usage is UsageDetails usage)`
`218`	`218`	`{`
`219`	`219`	`if (usage.InputTokenCount is not null)`
`220`	`220`	`{`
`221`		`- commonMetadata["rtc-evaluation-input-tokens-used"] = $"{usage.InputTokenCount}";`
	`221`	`+ commonMetadata["evaluation-input-tokens-used"] = $"{usage.InputTokenCount}";`
`222`	`222`	`}`
`223`	`223`
`224`	`224`	`if (usage.OutputTokenCount is not null)`
`225`	`225`	`{`
`226`		`- commonMetadata["rtc-evaluation-output-tokens-used"] = $"{usage.OutputTokenCount}";`
	`226`	`+ commonMetadata["evaluation-output-tokens-used"] = $"{usage.OutputTokenCount}";`
`227`	`227`	`}`
`228`	`228`
`229`	`229`	`if (usage.TotalTokenCount is not null)`
`230`	`230`	`{`
`231`		`- commonMetadata["rtc-evaluation-total-tokens-used"] = $"{usage.TotalTokenCount}";`
	`231`	`+ commonMetadata["evaluation-total-tokens-used"] = $"{usage.TotalTokenCount}";`
`232`	`232`	`}`
`233`	`233`	`}`
`234`	`234`
`235`		`- commonMetadata["rtc-evaluation-duration"] = duration;`
	`235`	`+ commonMetadata["evaluation-duration"] = duration;`
`236`	`236`
`237`	`237`	`NumericMetric relevance = result.Get<NumericMetric>(RelevanceMetricName);`
`238`	`238`	`relevance.Value = rating.Relevance;`
Original file line number	Diff line number	Diff line change
`@@ -263,7 +263,7 @@ await ResponseCacheProvider.GetCacheAsync(`
`263`	`263`
`264`	`264`	`private static IEnumerable<string> GetCachingKeysForChatClient(IChatClient chatClient)`
`265`	`265`	`{`
`266`		`- var metadata = chatClient.GetService<ChatClientMetadata>();`
	`266`	`+ ChatClientMetadata? metadata = chatClient.GetService<ChatClientMetadata>();`
`267`	`267`
`268`	`268`	`string? providerName = metadata?.ProviderName;`
`269`	`269`	`if (!string.IsNullOrWhiteSpace(providerName))`