test_cpu_manager.py 21 KB
Newer Older
1
2
3
4
5
6
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from collections.abc import Iterable
from dataclasses import dataclass

import numpy as np
7
import pytest
8

9
10
11
from vllm.v1.kv_offload.abstract import (
    LoadStoreSpec,
    OffloadingEvent,
12
    OffloadKey,
13
    PrepareStoreOutput,
14
    ReqContext,
15
    make_offload_key,
16
)
17
18
from vllm.v1.kv_offload.cpu.manager import CPUOffloadingManager
from vllm.v1.kv_offload.cpu.policies.arc import ARCCachePolicy
19
from vllm.v1.kv_offload.mediums import CPULoadStoreSpec
20
from vllm.v1.kv_offload.reuse_manager import FilterReusedOffloadingManager
21
22


23
24
25
26
27
28
29
30
def make_req_context(kv_transfer_params: dict | None = None) -> ReqContext:
    """Create a ReqContext as production code would, from a request's params."""
    return ReqContext(kv_transfer_params=kv_transfer_params)


_EMPTY_REQ_CTX = make_req_context()


31
32
@dataclass
class ExpectedPrepareStoreOutput:
33
    keys_to_store: list[int]
34
    store_block_ids: list[int]
35
    evicted_keys: list[int]
36
37


38
39
def to_keys(int_ids: list[int]) -> list[OffloadKey]:
    return [make_offload_key(str(i).encode(), 0) for i in int_ids]
40
41
42


def verify_store_output(
43
    prepare_store_output: PrepareStoreOutput | None,
44
45
    expected_prepare_store_output: ExpectedPrepareStoreOutput,
):
46
    assert prepare_store_output is not None
47
48
    assert prepare_store_output.keys_to_store == to_keys(
        expected_prepare_store_output.keys_to_store
49
    )
50
51
    assert prepare_store_output.evicted_keys == to_keys(
        expected_prepare_store_output.evicted_keys
52
    )
53
54
    store_spec = prepare_store_output.store_spec
    assert isinstance(store_spec, CPULoadStoreSpec)
55
56
57
    expected_array = np.array(
        expected_prepare_store_output.store_block_ids, dtype=np.int64
    )
58
59
60
    assert np.array_equal(expected_array, store_spec.block_ids)


61
62
63
def verify_load_output(
    prepare_load_output: LoadStoreSpec, expected_prepare_load_output: list[int]
):
64
65
66
67
68
    assert isinstance(prepare_load_output, CPULoadStoreSpec)
    expected_array = np.array(expected_prepare_load_output, dtype=np.int64)
    assert np.array_equal(expected_array, prepare_load_output.block_ids)


69
70
71
72
73
def verify_events(
    events: Iterable[OffloadingEvent],
    expected_stores: tuple[set[int], ...] = (),
    expected_evictions: tuple[set[int], ...] = (),
):
74
75
    stores: list[set[OffloadKey]] = []
    evictions: list[set[OffloadKey]] = []
76
77
78
    for event in events:
        assert event.medium == CPULoadStoreSpec.medium()
        if event.removed:
79
            evictions.append(set(event.keys))
80
        else:
81
            stores.append(set(event.keys))
82

83
84
85
86
    def to_key_sets(
        int_sets: tuple[set[int], ...],
    ) -> tuple[set[OffloadKey], ...]:
        return tuple([set(to_keys(list(int_set))) for int_set in int_sets])
87

88
89
    assert tuple(evictions) == to_key_sets(expected_evictions)
    assert tuple(stores) == to_key_sets(expected_stores)
90
91


92
93
@pytest.mark.parametrize("eviction_policy", ["lru", "arc"])
def test_already_stored_block_not_evicted_during_prepare_store(eviction_policy):
94
95
96
    """
    Regression test: a block that is already stored must not be evicted
    by prepare_store() when it needs to make room for new blocks.
97
    Applies to both lru and arc policies.
98
99
100
101
102
103
104
105
106
107

    Scenario:
        - Store blocks [1, 2] and complete.
        - touch([1]) makes block 2 the LRU candidate.
        - prepare_store([2, 3, 4, 5]):
            * block 2 is filtered out as "already stored"
            * but without the fix, block 2 would be evicted as the LRU
              candidate to make room for [3, 4, 5]
        - After complete_store([2, 3, 4, 5]), block 2 must still be present.
    """
108
109
110
111
112
    manager = CPUOffloadingManager(
        num_blocks=4,
        cache_policy=eviction_policy,
        enable_events=True,
    )
113
114

    # store [1, 2] and complete
115
    manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
116
    manager.complete_store(to_keys([1, 2]))
117
118

    # touch [1] to make block 2 the LRU candidate
119
    manager.touch(to_keys([1]))
120
121

    # prepare_store([2, 3, 4, 5]):
122
    #   - block 2 is already stored -> filtered out of keys_to_store
123
124
    #   - block 2 must NOT be evicted even though it is the LRU candidate
    #   - block 1 (ID 0) is evicted instead; new blocks [3,4,5] get IDs 2,3,0
125
    prepare_store_output = manager.prepare_store(to_keys([2, 3, 4, 5]), _EMPTY_REQ_CTX)
126
127
128
    verify_store_output(
        prepare_store_output,
        ExpectedPrepareStoreOutput(
129
            keys_to_store=[3, 4, 5],
130
            store_block_ids=[2, 3, 0],
131
            evicted_keys=[1],  # block 1 evicted, not block 2
132
133
134
135
        ),
    )

    # complete_store must not silently drop block 2
136
    manager.complete_store(to_keys([2, 3, 4, 5]))
137
138

    # block 2 must still be present in the cache
139
    assert manager.lookup(to_keys([2]), _EMPTY_REQ_CTX) == 1
140
141


142
143
def test_cpu_manager():
    """
144
    Tests CPUOffloadingManager with lru policy.
145
    """
146
    # initialize a CPU manager with a capacity of 4 blocks
147
    cpu_manager = CPUOffloadingManager(
148
        num_blocks=4, cache_policy="lru", enable_events=True
149
    )
150
151

    # prepare store [1, 2]
152
    prepare_store_output = cpu_manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
153
154
155
    verify_store_output(
        prepare_store_output,
        ExpectedPrepareStoreOutput(
156
            keys_to_store=[1, 2],
157
            store_block_ids=[0, 1],
158
            evicted_keys=[],
159
160
        ),
    )
161
162

    # lookup [1, 2] -> not ready
163
    assert cpu_manager.lookup(to_keys([1, 2]), _EMPTY_REQ_CTX) == 0
164
165
166
167
168

    # no events so far
    assert list(cpu_manager.take_events()) == []

    # complete store [1, 2]
169
    cpu_manager.complete_store(to_keys([1, 2]))
170
    verify_events(cpu_manager.take_events(), expected_stores=({1, 2},))
171
172

    # lookup [1, 2]
173
174
175
    assert cpu_manager.lookup(to_keys([1]), _EMPTY_REQ_CTX) == 1
    assert cpu_manager.lookup(to_keys([1, 2]), _EMPTY_REQ_CTX) == 2
    assert cpu_manager.lookup(to_keys([1, 2, 3]), _EMPTY_REQ_CTX) == 2
176
177

    # prepare store [2, 3, 4, 5] -> evicts [1]
178
179
180
    prepare_store_output = cpu_manager.prepare_store(
        to_keys([2, 3, 4, 5]), _EMPTY_REQ_CTX
    )
181
182
183
    verify_store_output(
        prepare_store_output,
        ExpectedPrepareStoreOutput(
184
            keys_to_store=[3, 4, 5],
185
            store_block_ids=[2, 3, 0],
186
            evicted_keys=[1],
187
188
        ),
    )
189
190

    # verify eviction event
191
    verify_events(cpu_manager.take_events(), expected_evictions=({1},))
192
193

    # prepare store with no space
194
    assert cpu_manager.prepare_store(to_keys([1, 6]), _EMPTY_REQ_CTX) is None
195
196

    # complete store [2, 3, 4, 5]
197
    cpu_manager.complete_store(to_keys([2, 3, 4, 5]))
198
199

    # prepare load [2, 3]
200
    prepare_load_output = cpu_manager.prepare_load(to_keys([2, 3]), _EMPTY_REQ_CTX)
201
202
203
    verify_load_output(prepare_load_output, [1, 2])

    # prepare store with no space ([2, 3] is being loaded)
204
    assert cpu_manager.prepare_store(to_keys([6, 7, 8]), _EMPTY_REQ_CTX) is None
205
206

    # complete load [2, 3]
207
    cpu_manager.complete_load(to_keys([2, 3]))
208
209

    # prepare store [6, 7, 8] -> evicts [2, 3, 4] (oldest)
210
    prepare_store_output = cpu_manager.prepare_store(to_keys([6, 7, 8]), _EMPTY_REQ_CTX)
211
212
213
    verify_store_output(
        prepare_store_output,
        ExpectedPrepareStoreOutput(
214
            keys_to_store=[6, 7, 8],
215
            store_block_ids=[3, 2, 1],
216
            evicted_keys=[2, 3, 4],
217
218
        ),
    )
219
220

    # complete store [6, 7, 8]
221
    cpu_manager.complete_store(to_keys([6, 7, 8]))
222
223

    # touch [5, 6, 7] (move to end of LRU order)
224
    cpu_manager.touch(to_keys([5, 6, 7]))
225
226

    # prepare store [7, 9] -> evicts [8] (oldest following previous touch)
227
    prepare_store_output = cpu_manager.prepare_store(to_keys([9]), _EMPTY_REQ_CTX)
228
229
230
    verify_store_output(
        prepare_store_output,
        ExpectedPrepareStoreOutput(
231
            keys_to_store=[9],
232
            store_block_ids=[1],
233
            evicted_keys=[8],
234
235
        ),
    )
236
237

    # complete store [7, 9] with failure
238
    cpu_manager.complete_store(to_keys([7, 9]), success=False)
239
240

    # assert [7] is still stored, but [9] is not
241
242
    assert cpu_manager.lookup(to_keys([7]), _EMPTY_REQ_CTX) == 1
    assert cpu_manager.lookup(to_keys([9]), _EMPTY_REQ_CTX) == 0
243

244
245
246
247
248
    verify_events(
        cpu_manager.take_events(),
        expected_stores=({3, 4, 5}, {6, 7, 8}),
        expected_evictions=({2, 3, 4}, {8}),
    )
249
250


251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
class TestARCPolicy:
    """Unit tests for CPUOffloadingManager with ARC eviction policy."""

    def _make_manager(
        self, num_blocks: int = 4, enable_events: bool = True
    ) -> tuple[CPUOffloadingManager, ARCCachePolicy]:
        manager = CPUOffloadingManager(
            num_blocks=num_blocks,
            cache_policy="arc",
            enable_events=enable_events,
        )
        policy = manager._policy
        assert isinstance(policy, ARCCachePolicy)
        return manager, policy

    def test_basic(self):
        """
        Tests CPUOffloadingManager with arc policy.
        Verifies that ARC handles store, load, and lookup operations correctly.
        """
        cpu_manager, arc_policy = self._make_manager()

        # prepare store [1, 2]
274
275
276
        prepare_store_output = cpu_manager.prepare_store(
            to_keys([1, 2]), _EMPTY_REQ_CTX
        )
277
278
279
        verify_store_output(
            prepare_store_output,
            ExpectedPrepareStoreOutput(
280
                keys_to_store=[1, 2],
281
                store_block_ids=[0, 1],
282
                evicted_keys=[],
283
284
285
286
            ),
        )

        # lookup [1, 2] -> not ready
287
        assert cpu_manager.lookup(to_keys([1, 2]), _EMPTY_REQ_CTX) == 0
288
289
290
291
292

        # no events so far
        assert list(cpu_manager.take_events()) == []

        # complete store [1, 2]
293
        cpu_manager.complete_store(to_keys([1, 2]))
294
        verify_events(cpu_manager.take_events(), expected_stores=({1, 2},))
295
296

        # lookup [1, 2]
297
298
299
        assert cpu_manager.lookup(to_keys([1]), _EMPTY_REQ_CTX) == 1
        assert cpu_manager.lookup(to_keys([1, 2]), _EMPTY_REQ_CTX) == 2
        assert cpu_manager.lookup(to_keys([1, 2, 3]), _EMPTY_REQ_CTX) == 2
300
301
302
303
304
305
306
307
308
309
310
311
312

        # blocks should be in T1 (recent)
        assert len(arc_policy.t1) == 2
        assert len(arc_policy.t2) == 0

    def test_t1_to_t2_promotion(self):
        """
        Tests that accessing a block in T1 promotes it to T2 (frequent).
        This is a key feature of ARC's adaptive behavior.
        """
        cpu_manager, arc_policy = self._make_manager(enable_events=False)

        # store and complete block 1
313
        cpu_manager.prepare_store(to_keys([1]), _EMPTY_REQ_CTX)
314
        cpu_manager.complete_store(to_keys([1]))
315
316

        # block 1 starts in T1 (recent)
317
318
        assert to_keys([1])[0] in arc_policy.t1
        assert to_keys([1])[0] not in arc_policy.t2
319
320

        # touch block 1 (simulate second access)
321
        cpu_manager.touch(to_keys([1]))
322
323

        # block 1 should now be in T2 (frequent)
324
325
        assert to_keys([1])[0] not in arc_policy.t1
        assert to_keys([1])[0] in arc_policy.t2
326
327
328
329
330
331
332
333
334

    def test_eviction_with_load(self):
        """
        Tests ARC eviction behavior similar to LRU test.
        Verifies that blocks being loaded (ref_cnt > 0) cannot be evicted.
        """
        cpu_manager, _ = self._make_manager()

        # prepare and complete store [1, 2, 3, 4]
335
336
337
        prepare_store_output = cpu_manager.prepare_store(
            to_keys([1, 2, 3, 4]), _EMPTY_REQ_CTX
        )
338
339
340
        verify_store_output(
            prepare_store_output,
            ExpectedPrepareStoreOutput(
341
                keys_to_store=[1, 2, 3, 4],
342
                store_block_ids=[0, 1, 2, 3],
343
                evicted_keys=[],
344
345
            ),
        )
346
        cpu_manager.complete_store(to_keys([1, 2, 3, 4]))
347
348

        # prepare load [2, 3] (increases ref_cnt)
349
        prepare_load_output = cpu_manager.prepare_load(to_keys([2, 3]), _EMPTY_REQ_CTX)
350
351
352
353
        verify_load_output(prepare_load_output, [1, 2])

        # prepare store [5, 6, 7] with [2, 3] being loaded
        # should fail because [2, 3] have ref_cnt > 0
354
        assert cpu_manager.prepare_store(to_keys([5, 6, 7]), _EMPTY_REQ_CTX) is None
355
356

        # complete load [2, 3]
357
        cpu_manager.complete_load(to_keys([2, 3]))
358
359
360

        # now prepare store [5, 6, 7] should succeed
        # ARC will evict blocks one at a time from T1 as needed
361
362
363
        prepare_store_output = cpu_manager.prepare_store(
            to_keys([5, 6, 7]), _EMPTY_REQ_CTX
        )
364
365
        assert prepare_store_output is not None
        # Should successfully evict enough blocks to make room (at least 1)
366
        assert len(prepare_store_output.evicted_keys) >= 1
367
368
369
370
371
372
373
374
375
376

    def test_adaptive_target(self):
        """
        Tests ARC's adaptive target adjustment via ghost lists.
        When a block in B1 (ghost list) is accessed, target_t1_size increases.
        When a block in B2 is accessed, target_t1_size decreases.
        """
        cpu_manager, arc_policy = self._make_manager(num_blocks=2, enable_events=False)

        # store blocks 1, 2 (fills cache)
377
        cpu_manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
378
        cpu_manager.complete_store(to_keys([1, 2]))
379
380
381
382

        initial_target = arc_policy.target_t1_size

        # store block 3, evicting block 1 (moves to B1 ghost list)
383
        cpu_manager.prepare_store(to_keys([3]), _EMPTY_REQ_CTX)
384
        cpu_manager.complete_store(to_keys([3]))
385
386

        # block 1 should be in B1 (ghost list)
387
        assert to_keys([1])[0] in arc_policy.b1
388
389
390

        # touch block 1 (cache miss, but in B1)
        # this should increase target_t1_size (favor recency)
391
        cpu_manager.touch(to_keys([1]))
392
393
394
395
396
397
398
399
400
401
402
403

        # target should have increased
        assert arc_policy.target_t1_size > initial_target

    def test_t1_t2_eviction_policy(self):
        """
        Tests that ARC evicts from T1 or T2 based on target_t1_size.
        If |T1| >= target_t1_size, evict from T1, otherwise from T2.
        """
        cpu_manager, arc_policy = self._make_manager(enable_events=False)

        # store blocks 1, 2, 3, 4
404
        cpu_manager.prepare_store(to_keys([1, 2, 3, 4]), _EMPTY_REQ_CTX)
405
        cpu_manager.complete_store(to_keys([1, 2, 3, 4]))
406
407

        # promote blocks 3, 4 to T2 by touching them
408
        cpu_manager.touch(to_keys([3, 4]))
409
410
411
412
413
414
415
416
417
418

        # now: T1 = {1, 2}, T2 = {3, 4}
        assert len(arc_policy.t1) == 2
        assert len(arc_policy.t2) == 2

        # set target_t1_size to prefer evicting from T1
        # (when |T1| >= target, evict from T1)
        arc_policy.target_t1_size = 1

        # store block 5, should evict from T1 (block 1, LRU in T1)
419
        output = cpu_manager.prepare_store(to_keys([5]), _EMPTY_REQ_CTX)
420
        assert output is not None
421
        assert to_keys([1]) == output.evicted_keys
422

423
        cpu_manager.complete_store(to_keys([5]))
424
425

        # block 1 should be in B1 (ghost list)
426
        assert to_keys([1])[0] in arc_policy.b1
427
        # block 5 should be in T1
428
        assert to_keys([5])[0] in arc_policy.t1
429
430
431
432
433
434
435
436
437

    def test_ghost_list_bounds(self):
        """
        Tests that ghost lists (B1, B2) don't grow unbounded.
        They should be capped at cache_capacity.
        """
        cpu_manager, arc_policy = self._make_manager(num_blocks=2, enable_events=False)

        # fill cache with blocks 1, 2
438
        cpu_manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
439
        cpu_manager.complete_store(to_keys([1, 2]))
440
441
442

        # store many blocks to fill ghost lists
        for i in range(3, 20):
443
            cpu_manager.prepare_store(to_keys([i]), _EMPTY_REQ_CTX)
444
            cpu_manager.complete_store(to_keys([i]))
445
446
447
448
449
450
451
452
453
454
455
456
457

        # ghost lists should not exceed cache_capacity
        assert len(arc_policy.b1) <= arc_policy.cache_capacity
        assert len(arc_policy.b2) <= arc_policy.cache_capacity

    def test_touch_ordering(self):
        """
        Tests that touch() correctly updates access patterns.
        Similar to LRU test but verifies T1/T2 ordering.
        """
        cpu_manager, arc_policy = self._make_manager()

        # store blocks 1, 2, 3, 4
458
        cpu_manager.prepare_store(to_keys([1, 2, 3, 4]), _EMPTY_REQ_CTX)
459
        cpu_manager.complete_store(to_keys([1, 2, 3, 4]))
460
461

        # promote 3, 4 to T2
462
        cpu_manager.touch(to_keys([3, 4]))
463
464
465

        # T1 = {1, 2}, T2 = {3, 4}
        # touch [1, 3, 4] - should promote 1 to T2, and move 3,4 to end of T2
466
        cpu_manager.touch(to_keys([1, 3, 4]))
467
468
469
470
471
472

        # T1 = {2}, T2 = {1, 3, 4} (in that order, with 4 most recent)
        assert len(arc_policy.t1) == 1
        assert len(arc_policy.t2) == 3

        # store block 5, should evict from T1 (block 2, only one in T1)
473
        prepare_store_output = cpu_manager.prepare_store(to_keys([5]), _EMPTY_REQ_CTX)
474
475
476
        verify_store_output(
            prepare_store_output,
            ExpectedPrepareStoreOutput(
477
                keys_to_store=[5],
478
                store_block_ids=[1],  # reuses block 2's storage
479
                evicted_keys=[2],
480
481
482
483
484
485
486
487
488
489
490
            ),
        )

    def test_failed_store(self):
        """
        Tests that failed store operations clean up correctly.
        Similar to LRU test but for ARC.
        """
        cpu_manager, arc_policy = self._make_manager()

        # store blocks 1, 2, 3, 4
491
        cpu_manager.prepare_store(to_keys([1, 2, 3, 4]), _EMPTY_REQ_CTX)
492
        cpu_manager.complete_store(to_keys([1, 2, 3, 4]))
493
494

        # prepare store block 5 (will evict block 1)
495
        prepare_store_output = cpu_manager.prepare_store(to_keys([5]), _EMPTY_REQ_CTX)
496
        assert prepare_store_output is not None
497
        assert len(prepare_store_output.evicted_keys) == 1
498
499

        # complete store with failure
500
        cpu_manager.complete_store(to_keys([5]), success=False)
501
502

        # block 5 should not be in cache
503
        assert cpu_manager.lookup(to_keys([5]), _EMPTY_REQ_CTX) == 0
504
        # block 5 should not be in T1 or T2
505
506
        assert to_keys([5])[0] not in arc_policy.t1
        assert to_keys([5])[0] not in arc_policy.t2
507
508

        # evicted block should still be gone (in B1 ghost list)
509
        evicted_hash = prepare_store_output.evicted_keys[0]
510
511
512
513
514
515
516
517
518
519
        assert evicted_hash in arc_policy.b1

    def test_full_scenario(self):
        """
        Comprehensive test covering multiple ARC operations in sequence.
        Similar to the full LRU test but adapted for ARC behavior.
        """
        cpu_manager, arc_policy = self._make_manager()

        # store [1, 2]
520
        cpu_manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
521
        cpu_manager.complete_store(to_keys([1, 2]))
522
523

        # store [3, 4, 5] -> evicts [1]
524
525
526
        prepare_store_output = cpu_manager.prepare_store(
            to_keys([3, 4, 5]), _EMPTY_REQ_CTX
        )
527
        assert prepare_store_output is not None
528
529
        assert len(prepare_store_output.evicted_keys) == 1
        cpu_manager.complete_store(to_keys([3, 4, 5]))
530
531

        # promote some blocks to T2
532
        cpu_manager.touch(to_keys([2, 3]))
533
534
535
536
537
538

        # T1 has {4, 5}, T2 has {2, 3}
        assert len(arc_policy.t1) == 2
        assert len(arc_policy.t2) == 2

        # store [6] -> should evict from T1 (4 is oldest in T1)
539
        prepare_store_output = cpu_manager.prepare_store(to_keys([6]), _EMPTY_REQ_CTX)
540
        assert prepare_store_output is not None
541
        cpu_manager.complete_store(to_keys([6]))
542
543

        # verify blocks 2, 3 (in T2) are still present
544
545
        assert cpu_manager.lookup(to_keys([2]), _EMPTY_REQ_CTX) == 1
        assert cpu_manager.lookup(to_keys([3]), _EMPTY_REQ_CTX) == 1
546
547
548
549

        # verify events
        events = list(cpu_manager.take_events())
        assert len(events) > 0  # should have store and eviction events
550
551
552
553


def test_filter_reused_manager():
    """
554
    Tests FilterReusedOffloadingManager with a CPUOffloadingManager.
555
    """
556
    lru_manager = CPUOffloadingManager(
557
        num_blocks=4, cache_policy="lru", enable_events=True
558
    )
559
560
561
562
563
564

    manager = FilterReusedOffloadingManager(
        backing=lru_manager, store_threshold=2, max_tracker_size=3
    )

    # Lookup [1, 2] -> 1st time, added to tracker but not eligible for store yet
565
    assert manager.lookup(to_keys([1, 2]), _EMPTY_REQ_CTX) == 0
566
567

    # prepare store [1, 2] -> should be filtered
568
    prepare_store_output = manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
569
    assert prepare_store_output is not None
570
    assert prepare_store_output.keys_to_store == []
571
572

    # Lookup [1] -> 2nd time, eligible now
573
    assert manager.lookup(to_keys([1]), _EMPTY_REQ_CTX) == 0
574
575

    # prepare store [1, 2] -> [1] should be eligible, [2] should be filtered
576
    prepare_store_output = manager.prepare_store(to_keys([1, 2]), _EMPTY_REQ_CTX)
577
    assert prepare_store_output is not None
578
    assert prepare_store_output.keys_to_store == to_keys([1])
579
580
581

    # Lookup [3, 4] -> 1st time
    # (evicts [2] from tracker since max_size is 3 and tracker has [1])
582
    assert manager.lookup(to_keys([3, 4]), _EMPTY_REQ_CTX) == 0
583
    # Verify [2] was evicted from the tracker (tracker now has: [1], [3], [4])
584
    assert to_keys([2])[0] not in manager.counts
585
586

    # Lookup [2] again -> (this adds [2] back to the tracker as 1st time)
587
    assert manager.lookup(to_keys([2]), _EMPTY_REQ_CTX) == 0
588
    # Verify [2] was re-added with count=1 (not eligible yet)
589
    assert manager.counts.get(to_keys([2])[0]) == 1
590
591

    # prepare store [2] -> should still be filtered out since count was reset
592
    prepare_store_output = manager.prepare_store(to_keys([2]), _EMPTY_REQ_CTX)
593
    assert prepare_store_output is not None
594
    assert prepare_store_output.keys_to_store == []
595

596
    manager.complete_store(to_keys([1]))