mirror of
https://github.com/microsoft/agent-framework.git
synced 2026-06-16 21:04:09 +08:00
626b418622
* .NET: Add a TODO AIContextProvider (#5233) * Add a TODO AIContextProvider * Add unit tests * Address PR comments * Address PR comments * Fix test after removing one tool * .NET: Add a ModeProvider for managing agent modes (#5247) * Add a ModeProvider for managing agent modes * Fix typo * Fix typo * Fix typo * Address PR comments * .NET: Add sample to show how to build a harness (#5268) * Add sample to show how to build a harness * Improve sample * Sample max output tokens and model * Fix encoding * Fix model name in readme * Address PR comments * .NET: Add context window size compaction strategy for harness (#5304) * Add context window size compaction strategy for harness * Apply suggestions from code review Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> * Address PR comments --------- Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> * .NET: Add a file memory provider (#5315) * Add a file memory provider * Address PR comments * Fix review comments. * Add additional unit tests * Addressing PR comments. * .NET: Harness: Improve prompts and add FileSystem store (#5365) * Harness: Improve prompts and add FileSystem store * Address PR comments * .NET: Harness: Improve path validation (#5404) * Harness: Improve path validation * Address PR comments * .NET: Add always approve helpers, improve sample and fix bug (#5451) * Add always approve helpers, improve sample and fix bug * Address PR comments * .NET: Make Todo, Mode and FileMemory providers more configurable (#5477) * Make Todo, Mode and FileMemory providers more configurable * Address PR comments. * .NET: Add subagents provider and sample (#5518) * Add subagents provider and sample * Addressing PR comments. * .NET: Harness filememory index plus instructions consistency (#5540) * Add FileMemoryProvider index and improve instruction consistency * Address PR comments. * Address PR comments * Address PR comments. * Apply suggestion from @rogerbarreto Co-authored-by: Roger Barreto <19890735+rogerbarreto@users.noreply.github.com> --------- Co-authored-by: Roger Barreto <19890735+rogerbarreto@users.noreply.github.com> * .NET: Refactor harness console to be more extensible and easy to understand with better UX (#5573) * Refactor harness console to be more extensible and easy to understand with better UX. * Fix formatting issues. * Allow multiple clarifications in one response * Address PR comments * .NET: Add FileAccessProvdider and concurrency fix for FileMemoryProvider (#5583) * Add FileAccessProvdider and concurrency fix for FileMemoryProvider * Address PR comments --------- Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> Co-authored-by: Roger Barreto <19890735+rogerbarreto@users.noreply.github.com>
220 lines
8.5 KiB
C#
220 lines
8.5 KiB
C#
// Copyright (c) Microsoft. All rights reserved.
|
|
|
|
using System;
|
|
using System.Collections.Generic;
|
|
using System.Threading.Tasks;
|
|
using Microsoft.Agents.AI.Compaction;
|
|
using Microsoft.Extensions.AI;
|
|
|
|
namespace Microsoft.Agents.AI.UnitTests.Compaction;
|
|
|
|
/// <summary>
|
|
/// Contains tests for the <see cref="ContextWindowCompactionStrategy"/> class.
|
|
/// </summary>
|
|
public class ContextWindowCompactionStrategyTests
|
|
{
|
|
[Fact]
|
|
public void Constructor_ValidParameters_SetsProperties()
|
|
{
|
|
// Arrange & Act
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 1_050_000,
|
|
maxOutputTokens: 128_000);
|
|
|
|
// Assert
|
|
Assert.Equal(1_050_000, strategy.MaxContextWindowTokens);
|
|
Assert.Equal(128_000, strategy.MaxOutputTokens);
|
|
Assert.Equal(922_000, strategy.InputBudgetTokens);
|
|
Assert.Equal(ContextWindowCompactionStrategy.DefaultToolEvictionThreshold, strategy.ToolEvictionThreshold);
|
|
Assert.Equal(ContextWindowCompactionStrategy.DefaultTruncationThreshold, strategy.TruncationThreshold);
|
|
}
|
|
|
|
[Fact]
|
|
public void Constructor_CustomThresholds_SetsProperties()
|
|
{
|
|
// Arrange & Act
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 1_000_000,
|
|
maxOutputTokens: 100_000,
|
|
toolEvictionThreshold: 0.3,
|
|
truncationThreshold: 0.6);
|
|
|
|
// Assert
|
|
Assert.Equal(900_000, strategy.InputBudgetTokens);
|
|
Assert.Equal(0.3, strategy.ToolEvictionThreshold);
|
|
Assert.Equal(0.6, strategy.TruncationThreshold);
|
|
}
|
|
|
|
[Theory]
|
|
[InlineData(0, 100)] // maxContextWindowTokens <= 0
|
|
[InlineData(-1, 100)] // maxContextWindowTokens negative
|
|
public void Constructor_InvalidContextWindow_Throws(int contextWindow, int maxOutput)
|
|
{
|
|
// Act & Assert
|
|
Assert.Throws<ArgumentOutOfRangeException>(() =>
|
|
new ContextWindowCompactionStrategy(contextWindow, maxOutput));
|
|
}
|
|
|
|
[Theory]
|
|
[InlineData(1000, -1)] // maxOutputTokens negative
|
|
[InlineData(1000, 1000)] // maxOutputTokens == contextWindow
|
|
[InlineData(1000, 1001)] // maxOutputTokens > contextWindow
|
|
public void Constructor_InvalidOutputTokens_Throws(int contextWindow, int maxOutput)
|
|
{
|
|
// Act & Assert
|
|
Assert.Throws<ArgumentOutOfRangeException>(() =>
|
|
new ContextWindowCompactionStrategy(contextWindow, maxOutput));
|
|
}
|
|
|
|
[Theory]
|
|
[InlineData(0.0)] // Zero threshold
|
|
[InlineData(-0.1)] // Negative threshold
|
|
[InlineData(1.1)] // Over 1.0
|
|
public void Constructor_InvalidToolEvictionThreshold_Throws(double threshold)
|
|
{
|
|
// Act & Assert
|
|
Assert.Throws<ArgumentOutOfRangeException>(() =>
|
|
new ContextWindowCompactionStrategy(1000, 100, toolEvictionThreshold: threshold));
|
|
}
|
|
|
|
[Theory]
|
|
[InlineData(0.0)] // Zero threshold
|
|
[InlineData(-0.1)] // Negative threshold
|
|
[InlineData(1.1)] // Over 1.0
|
|
public void Constructor_InvalidTruncationThreshold_Throws(double threshold)
|
|
{
|
|
// Act & Assert
|
|
Assert.Throws<ArgumentOutOfRangeException>(() =>
|
|
new ContextWindowCompactionStrategy(1000, 100, truncationThreshold: threshold));
|
|
}
|
|
|
|
[Fact]
|
|
public void Constructor_TruncationBelowToolEviction_Throws()
|
|
{
|
|
// Act & Assert
|
|
Assert.Throws<ArgumentOutOfRangeException>(() =>
|
|
new ContextWindowCompactionStrategy(1000, 100, toolEvictionThreshold: 0.8, truncationThreshold: 0.5));
|
|
}
|
|
|
|
[Fact]
|
|
public async Task CompactAsync_BelowToolEvictionThreshold_NoCompactionAsync()
|
|
{
|
|
// Arrange — input budget = 900 tokens, tool eviction at 450, truncation at 720
|
|
// A few short messages should be well below any threshold.
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 1000,
|
|
maxOutputTokens: 100);
|
|
|
|
CompactionMessageIndex index = CompactionMessageIndex.Create(
|
|
[
|
|
new ChatMessage(ChatRole.User, "Hello"),
|
|
new ChatMessage(ChatRole.Assistant, "Hi there!"),
|
|
]);
|
|
|
|
// Act
|
|
bool result = await strategy.CompactAsync(index);
|
|
|
|
// Assert
|
|
Assert.False(result);
|
|
Assert.Equal(2, index.IncludedGroupCount);
|
|
}
|
|
|
|
[Fact]
|
|
public async Task CompactAsync_AboveTruncationThreshold_TruncatesOldestAsync()
|
|
{
|
|
// Arrange — use a budget of 5 tokens with truncation at 80% = 4 token threshold.
|
|
// Even the shortest messages will exceed this, ensuring truncation fires.
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 10,
|
|
maxOutputTokens: 5,
|
|
toolEvictionThreshold: 0.5,
|
|
truncationThreshold: 0.8);
|
|
|
|
// Verify internal budget calculation
|
|
Assert.Equal(5, strategy.InputBudgetTokens);
|
|
|
|
CompactionMessageIndex index = CompactionMessageIndex.Create(
|
|
[
|
|
new ChatMessage(ChatRole.User, "First user message"),
|
|
new ChatMessage(ChatRole.Assistant, "First response"),
|
|
new ChatMessage(ChatRole.User, "Second user message"),
|
|
new ChatMessage(ChatRole.Assistant, "Second response"),
|
|
]);
|
|
|
|
int groupsBefore = index.IncludedGroupCount;
|
|
int tokensBefore = index.IncludedTokenCount;
|
|
|
|
// Verify tokens actually exceed the truncation threshold (80% of 5 = 4)
|
|
Assert.True(tokensBefore > 4, $"Expected tokens > 4 but got {tokensBefore}");
|
|
Assert.True(groupsBefore > 1, $"Expected groups > 1 but got {groupsBefore}");
|
|
|
|
// Act
|
|
bool result = await strategy.CompactAsync(index);
|
|
|
|
// Assert — with tokens well above a 4-token threshold, truncation should fire
|
|
Assert.True(result, $"Expected compaction to occur. Tokens before: {tokensBefore}, groups before: {groupsBefore}, NonSystemGroups: {index.IncludedNonSystemGroupCount}");
|
|
Assert.True(index.IncludedGroupCount < groupsBefore);
|
|
}
|
|
|
|
[Fact]
|
|
public async Task CompactAsync_ToolCallsAboveEvictionThreshold_CollapsesToolCallsAsync()
|
|
{
|
|
// Arrange — very small budget so tool eviction fires.
|
|
// Input budget = 5, tool eviction at 50% = 2 token threshold.
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 10,
|
|
maxOutputTokens: 5,
|
|
toolEvictionThreshold: 0.5,
|
|
truncationThreshold: 0.9);
|
|
|
|
// Build messages with a tool call group: assistant with FunctionCallContent + tool result
|
|
var assistantMessage = new ChatMessage(ChatRole.Assistant, [new FunctionCallContent("call1", "get_data", arguments: new Dictionary<string, object?> { ["query"] = "test" })]);
|
|
var toolResultMessage = new ChatMessage(ChatRole.Tool, [new FunctionResultContent("call1", "Here is a long result with many words to ensure we exceed the token threshold")]);
|
|
var userMessage = new ChatMessage(ChatRole.User, "What did you find?");
|
|
var assistantResponse = new ChatMessage(ChatRole.Assistant, "Based on the results I found information.");
|
|
|
|
CompactionMessageIndex index = CompactionMessageIndex.Create(
|
|
[
|
|
assistantMessage,
|
|
toolResultMessage,
|
|
userMessage,
|
|
assistantResponse,
|
|
]);
|
|
|
|
// Act
|
|
bool result = await strategy.CompactAsync(index);
|
|
|
|
// Assert — compaction should succeed for tool calls above the eviction threshold.
|
|
// Do not assert on IncludedTokenCount because tool-result compaction preserves content
|
|
// in summary form and tokenization can make the count stay the same or increase.
|
|
Assert.True(result);
|
|
}
|
|
|
|
[Fact]
|
|
public void Constructor_EqualThresholds_Succeeds()
|
|
{
|
|
// Arrange & Act — truncation == tool eviction should be valid
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 1000,
|
|
maxOutputTokens: 100,
|
|
toolEvictionThreshold: 0.7,
|
|
truncationThreshold: 0.7);
|
|
|
|
// Assert
|
|
Assert.Equal(0.7, strategy.ToolEvictionThreshold);
|
|
Assert.Equal(0.7, strategy.TruncationThreshold);
|
|
}
|
|
|
|
[Fact]
|
|
public void Constructor_ZeroMaxOutputTokens_FullBudget()
|
|
{
|
|
// Arrange & Act
|
|
var strategy = new ContextWindowCompactionStrategy(
|
|
maxContextWindowTokens: 1_000_000,
|
|
maxOutputTokens: 0);
|
|
|
|
// Assert — entire context window is the input budget
|
|
Assert.Equal(1_000_000, strategy.InputBudgetTokens);
|
|
}
|
|
}
|