akg/akg_agents/tests/ut/cache_tests/test_cache_integration.py-代码预览-akg:基于深度学习的算子优化与自动生成项目 - AtomGit

liuliting2025 — test(cache): complete test specification rectification, directory migration and code normalization
# Copyright 2026 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import pytest

from akg_agents.core_v2.llm.cache import LLMCache, attach_cache_to_client
from akg_agents.core_v2.llm.client import LLMClient


class FakeProvider:
    """In-memory provider stub that counts how often ``generate`` is called.

    Attributes are set in ``__init__``:
    ``model_name`` is the fixed string ``"fake-model"`` and ``calls`` starts
    at zero and grows by one per ``generate`` invocation.
    """

    def __init__(self):
        self.calls = 0
        self.model_name = "fake-model"

    async def generate(self, messages, tools=None, **config):
        """Return a canned response whose content embeds the call counter.

        ``messages``, ``tools`` and ``config`` are accepted but not inspected;
        only the running call count influences the returned payload.
        """
        self.calls = self.calls + 1
        response = {
            "content": f"ok-{self.calls}",
            "reasoning_content": "",
            "tool_calls": [],
            "usage": {},
        }
        return response


@pytest.mark.asyncio
async def test_cache_off_mode_bypasses_cache(temp_cache_file):
    """Check that ``cache_mode="off"`` sends every request to the provider.

    Two identical requests are issued with caching switched off; the fake
    provider must be invoked twice and the two results must differ.
    """
    fake_provider = FakeProvider()
    llm_client = LLMClient(provider=fake_provider)
    llm_cache = LLMCache(
        max_memory_size=10,
        cache_file_path=temp_cache_file,
        expire_seconds=3600,
    )
    attach_cache_to_client(llm_client, cache=llm_cache)

    prompt = [{"role": "user", "content": "hello"}]

    first = await llm_client.generate(prompt, cache_mode="off")
    second = await llm_client.generate(prompt, cache_mode="off")

    # Each call reached the provider, so the counter-based payloads differ.
    assert fake_provider.calls == 2
    assert first != second


@pytest.mark.asyncio
async def test_cache_record_mode_hit(temp_cache_file):
    """Check that ``cache_mode="record"`` answers a repeated request from cache.

    The same messages are sent twice in record mode. The fake provider must be
    invoked exactly once and both calls must return equal results.

    The cache is cleared in a ``finally`` clause so that cleanup also happens
    when one of the assertions (or a ``generate`` call) fails.
    """
    cache = LLMCache(
        max_memory_size=10,
        cache_file_path=temp_cache_file,
        expire_seconds=3600,
    )
    provider = FakeProvider()
    client = LLMClient(provider=provider)
    attach_cache_to_client(client, cache=cache)

    messages = [{"role": "user", "content": "hello"}]

    try:
        result1 = await client.generate(messages, cache_mode="record")
        result2 = await client.generate(messages, cache_mode="record")

        # Second call is expected to be a cache hit: no extra provider call.
        assert provider.calls == 1
        assert result1 == result2
    finally:
        # Always clear, even on failure, so no cached entries are left behind.
        cache.clear_all_cache()


@pytest.mark.asyncio
async def test_cache_refresh_and_disable(temp_cache_file):
    """Check that ``cache_refresh=True`` and ``cache_mode="off"`` skip cache hits.

    Three identical requests are issued: a plain record, a record with
    ``cache_refresh=True``, and one with caching off. Each of them must reach
    the fake provider, giving three provider calls in total.

    The cache is cleared in a ``finally`` clause so that cleanup also happens
    when the assertion (or a ``generate`` call) fails.
    """
    cache = LLMCache(
        max_memory_size=10,
        cache_file_path=temp_cache_file,
        expire_seconds=3600,
    )
    provider = FakeProvider()
    client = LLMClient(provider=provider)
    attach_cache_to_client(client, cache=cache)

    messages = [{"role": "user", "content": "hello"}]

    try:
        await client.generate(messages, cache_mode="record")
        await client.generate(messages, cache_mode="record", cache_refresh=True)
        await client.generate(messages, cache_mode="off")

        assert provider.calls == 3
    finally:
        # Always clear, even on failure, so no cached entries are left behind.
        cache.clear_all_cache()


@pytest.mark.asyncio
async def test_cache_session_record_and_replay(temp_cache_file):
    """Check that a recorded session can be replayed without provider calls.

    Two steps are recorded under one session hash with distinct agent hashes.
    They are then replayed with *different* message contents but the same
    session/agent hashes; the replayed results must equal the recorded ones
    and the provider call count must not grow during replay.
    """
    fake_provider = FakeProvider()
    llm_client = LLMClient(provider=fake_provider)
    llm_cache = LLMCache(
        max_memory_size=10,
        cache_file_path=temp_cache_file,
        expire_seconds=3600,
    )
    attach_cache_to_client(llm_client, cache=llm_cache)

    session_hash = "session-001"

    async def _ask(content, mode, agent_hash):
        # Single place that issues a session-scoped request to the client.
        return await llm_client.generate(
            [{"role": "user", "content": content}],
            cache_mode=mode,
            cache_session_hash=session_hash,
            cache_agent_hash=agent_hash,
        )

    # Record phase: both steps go through the provider.
    recorded_a = await _ask("step-a", "record", "0@1")
    recorded_b = await _ask("step-b", "record", "0@2")
    calls_after_record = fake_provider.calls

    # Replay phase: message text differs, session/agent hashes are reused.
    replayed_a = await _ask("different-a", "replay", "0@1")
    replayed_b = await _ask("different-b", "replay", "0@2")

    assert fake_provider.calls == calls_after_record
    assert replayed_a == recorded_a
    assert replayed_b == recorded_b


@pytest.mark.asyncio
async def test_cache_session_replay_miss_fallback_and_fill(temp_cache_file):
    """Check that replaying an unrecorded session raises and skips the provider.

    A replay request is made for a session that was never recorded. The call
    must raise ``RuntimeError`` matching "Replay cache miss", and the fake
    provider must not have been invoked.

    NOTE(review): the test name mentions "fallback and fill", but the body
    only asserts the error path — confirm whether the name is outdated.
    """
    fake_provider = FakeProvider()
    llm_client = LLMClient(provider=fake_provider)
    llm_cache = LLMCache(
        max_memory_size=10,
        cache_file_path=temp_cache_file,
        expire_seconds=3600,
    )
    attach_cache_to_client(llm_client, cache=llm_cache)

    session_hash = "session-miss"
    prompt = [{"role": "user", "content": "first-call"}]

    with pytest.raises(RuntimeError, match="Replay cache miss"):
        await llm_client.generate(
            prompt,
            cache_mode="replay",
            cache_session_hash=session_hash,
            cache_agent_hash="0@3",
        )

    # The miss must not have been forwarded to the provider.
    assert fake_provider.calls == 0