@@ -20,19 +20,19 @@ TEST_F(GenerationConfigTest, TestResolveMaxNewTokensBothDefault) {
2020 GenerationConfig config;
2121 // Default values: seq_len = -1, max_new_tokens = -1
2222
23- // max_context_len = 100, num_prompt_tokens = 20
24- // Expected: max_context_len - num_prompt_tokens = 100 - 20 = 80
23+ // max_context_len = 100, num_tokens_occupied = 20
24+ // Expected: max_context_len - num_tokens_occupied = 100 - 20 = 80
2525 EXPECT_EQ (config.resolve_max_new_tokens (100 , 20 ), 80 );
2626
27- // max_context_len = 50, num_prompt_tokens = 30
28- // Expected: max_context_len - num_prompt_tokens = 50 - 30 = 20
27+ // max_context_len = 50, num_tokens_occupied = 30
28+ // Expected: max_context_len - num_tokens_occupied = 50 - 30 = 20
2929 EXPECT_EQ (config.resolve_max_new_tokens (50 , 30 ), 20 );
3030
31- // Edge case: num_prompt_tokens equals max_context_len
31+ // Edge case: num_tokens_occupied equals max_context_len
3232 // Expected: 0 (no tokens left)
3333 EXPECT_EQ (config.resolve_max_new_tokens (40 , 40 ), 0 );
3434
35- // Edge case: num_prompt_tokens exceeds max_context_len
35+ // Edge case: num_tokens_occupied exceeds max_context_len
3636 // Expected: 0 (no tokens left, and we ensure non-negative result)
3737 EXPECT_EQ (config.resolve_max_new_tokens (30 , 50 ), 0 );
3838}
@@ -43,17 +43,17 @@ TEST_F(GenerationConfigTest, TestResolveMaxNewTokensOnlyMaxNewTokens) {
4343 config.seq_len = -1 ;
4444 config.max_new_tokens = 25 ;
4545
46- // max_context_len = 100, num_prompt_tokens = 20
46+ // max_context_len = 100, num_tokens_occupied = 20
4747 // Available tokens: 100 - 20 = 80
4848 // Expected: min(max_new_tokens, available) = min(25, 80) = 25
4949 EXPECT_EQ (config.resolve_max_new_tokens (100 , 20 ), 25 );
5050
51- // max_context_len = 50, num_prompt_tokens = 40
51+ // max_context_len = 50, num_tokens_occupied = 40
5252 // Available tokens: 50 - 40 = 10
5353 // Expected: min(max_new_tokens, available) = min(25, 10) = 10
5454 EXPECT_EQ (config.resolve_max_new_tokens (50 , 40 ), 10 );
5555
56- // Edge case: num_prompt_tokens equals max_context_len
56+ // Edge case: num_tokens_occupied equals max_context_len
5757 // Available tokens: 0
5858 // Expected: 0 (no tokens left)
5959 EXPECT_EQ (config.resolve_max_new_tokens (40 , 40 ), 0 );
@@ -65,21 +65,21 @@ TEST_F(GenerationConfigTest, TestResolveMaxNewTokensOnlySeqLen) {
6565 config.seq_len = 50 ;
6666 config.max_new_tokens = -1 ;
6767
68- // max_context_len = 100, num_prompt_tokens = 20
68+ // max_context_len = 100, num_tokens_occupied = 20
6969 // Effective seq_len: min(seq_len, max_context_len) = min(50, 100) = 50
70- // Expected: effective_seq_len - num_prompt_tokens = 50 - 20 = 30
70+ // Expected: effective_seq_len - num_tokens_occupied = 50 - 20 = 30
7171 EXPECT_EQ (config.resolve_max_new_tokens (100 , 20 ), 30 );
7272
73- // max_context_len = 40, num_prompt_tokens = 20
73+ // max_context_len = 40, num_tokens_occupied = 20
7474 // Effective seq_len: min(seq_len, max_context_len) = min(50, 40) = 40
75- // Expected: effective_seq_len - num_prompt_tokens = 40 - 20 = 20
75+ // Expected: effective_seq_len - num_tokens_occupied = 40 - 20 = 20
7676 EXPECT_EQ (config.resolve_max_new_tokens (40 , 20 ), 20 );
7777
78- // Edge case: num_prompt_tokens equals effective seq_len
78+ // Edge case: num_tokens_occupied equals effective seq_len
7979 // Expected: 0 (no tokens left)
8080 EXPECT_EQ (config.resolve_max_new_tokens (100 , 50 ), 0 );
8181
82- // Edge case: num_prompt_tokens exceeds effective seq_len
82+ // Edge case: num_tokens_occupied exceeds effective seq_len
8383 // Expected: 0 (no tokens left, and we ensure non-negative result)
8484 EXPECT_EQ (config.resolve_max_new_tokens (100 , 60 ), 0 );
8585}
@@ -90,19 +90,19 @@ TEST_F(GenerationConfigTest, TestResolveMaxNewTokensBothSpecified) {
9090 config.seq_len = 50 ;
9191 config.max_new_tokens = 25 ;
9292
93- // max_context_len = 100, num_prompt_tokens = 20
93+ // max_context_len = 100, num_tokens_occupied = 20
9494 // Effective seq_len: min(seq_len, max_context_len) = min(50, 100) = 50
95- // Available tokens: effective_seq_len - num_prompt_tokens = 50 - 20 = 30
95+ // Available tokens: effective_seq_len - num_tokens_occupied = 50 - 20 = 30
9696 // Expected: min(max_new_tokens, available) = min(25, 30) = 25
9797 EXPECT_EQ (config.resolve_max_new_tokens (100 , 20 ), 25 );
9898
99- // max_context_len = 40, num_prompt_tokens = 20
99+ // max_context_len = 40, num_tokens_occupied = 20
100100 // Effective seq_len: min(seq_len, max_context_len) = min(50, 40) = 40
101- // Available tokens: effective_seq_len - num_prompt_tokens = 40 - 20 = 20
101+ // Available tokens: effective_seq_len - num_tokens_occupied = 40 - 20 = 20
102102 // Expected: min(max_new_tokens, available) = min(25, 20) = 20
103103 EXPECT_EQ (config.resolve_max_new_tokens (40 , 20 ), 20 );
104104
105- // Edge case: num_prompt_tokens equals effective seq_len
105+ // Edge case: num_tokens_occupied equals effective seq_len
106106 // Available tokens: 0
107107 // Expected: 0 (no tokens left)
108108 EXPECT_EQ (config.resolve_max_new_tokens (40 , 40 ), 0 );
0 commit comments