# pylint: disable=protected-access
import math

import pytest

from graphgen.models.llm.api.http_client import HTTPClient


class DummyTokenizer:
    def encode(self, text: str):
        # simple tokenization: split on spaces
        return text.split()


class _MockResponse:
    def __init__(self, data):
        self._data = data

    def raise_for_status(self):
        return None

    async def json(self):
        return self._data


class _PostCtx:
    def __init__(self, data):
        self._resp = _MockResponse(data)

    async def __aenter__(self):
        return self._resp

    async def __aexit__(self, exc_type, exc, tb):
        return False


class MockSession:
    def __init__(self, data):
        self._data = data
        self.closed = False

    def post(self, *args, **kwargs):
        return _PostCtx(self._data)

    async def close(self):
        self.closed = True


class DummyLimiter:
    def __init__(self):
        self.calls = []

    async def wait(self, *args, **kwargs):
        self.calls.append((args, kwargs))

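# Together these doubles replace HTTPClient's runtime collaborators:
# MockSession mimics an aiohttp-style session whose ``post`` returns an
# async context manager yielding a canned JSON response, DummyTokenizer
# stands in for a real tokenizer, and DummyLimiter records ``wait`` calls
# so the tests can assert that the rate limiters were consulted. (That
# HTTPClient talks to an aiohttp-like session is an assumption drawn from
# the post/raise_for_status/json shape mocked here.)
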
@pytest.mark.asyncio
async def test_generate_answer_records_usage_and_uses_limiters():
    # arrange
    data = {
        "choices": [{"message": {"content": "Hello <think>world</think>!"}}],
        "usage": {"prompt_tokens": 3, "completion_tokens": 2, "total_tokens": 5},
    }
    client = HTTPClient(model_name="m", base_url="http://test")
    client._session = MockSession(data)
    client.tokenizer = DummyTokenizer()
    client.system_prompt = "sys"
    client.temperature = 0.0
    client.top_p = 1.0
    client.max_tokens = 10
    client.filter_think_tags = lambda s: s.replace("<think>", "").replace(
        "</think>", ""
    )
    rpm = DummyLimiter()
    tpm = DummyLimiter()
    client.rpm = rpm
    client.tpm = tpm
    client.request_limit = True

    # act
    out = await client.generate_answer("hi", history=["u1", "a1"])

    # assert
    assert out == "Hello world!"
    assert client.token_usage[-1] == {
        "prompt_tokens": 3,
        "completion_tokens": 2,
        "total_tokens": 5,
    }
    assert len(rpm.calls) == 1
    assert len(tpm.calls) == 1

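# A follow-on sketch, not part of the original change set: it assumes
# HTTPClient appends one entry to ``token_usage`` per successful request
# (the single-call behaviour the test above already relies on) and checks
# that repeated calls accumulate records.
@pytest.mark.asyncio
async def test_generate_answer_accumulates_usage():
    data = {
        "choices": [{"message": {"content": "ok"}}],
        "usage": {"prompt_tokens": 1, "completion_tokens": 1, "total_tokens": 2},
    }
    client = HTTPClient(model_name="m", base_url="http://test")
    client._session = MockSession(data)
    client.tokenizer = DummyTokenizer()
    client.system_prompt = "sys"
    client.temperature = 0.0
    client.top_p = 1.0
    client.max_tokens = 10
    client.filter_think_tags = lambda s: s  # identity: payload has no think tags
    client.rpm = DummyLimiter()
    client.tpm = DummyLimiter()
    client.request_limit = True

    before = len(client.token_usage)
    await client.generate_answer("first")
    await client.generate_answer("second")

    assert len(client.token_usage) == before + 2
    assert client.token_usage[-1]["total_tokens"] == 2
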
@pytest.mark.asyncio
async def test_generate_topk_per_token_parses_logprobs():
    # arrange: two token items, each carrying its own logprob plus a
    # top-2 candidate list
    data = {
        "choices": [
            {
                "logprobs": {
                    "content": [
                        {
                            "token": "A",
                            "logprob": math.log(0.6),
                            "top_logprobs": [
                                {"token": "A", "logprob": math.log(0.6)},
                                {"token": "B", "logprob": math.log(0.4)},
                            ],
                        },
                        {
                            "token": "B",
                            "logprob": math.log(0.2),
                            "top_logprobs": [
                                {"token": "B", "logprob": math.log(0.2)},
                                {"token": "C", "logprob": math.log(0.8)},
                            ],
                        },
                    ]
                }
            }
        ]
    }
    client = HTTPClient(model_name="m", base_url="http://test")
    client._session = MockSession(data)
    client.tokenizer = DummyTokenizer()
    client.system_prompt = None
    client.temperature = 0.0
    client.top_p = 1.0
    client.max_tokens = 10
    client.topk_per_token = 2

    # act
    tokens = await client.generate_topk_per_token("hi", history=[])

    # assert
    assert len(tokens) == 2
    # each token's prob should round-trip the mocked logprob through exp,
    # and the top-k candidates should keep the order returned by the API
    assert abs(tokens[0].prob - 0.6) < 1e-9
    assert abs(tokens[1].prob - 0.2) < 1e-9
    assert len(tokens[0].top_candidates) == 2
    assert tokens[0].top_candidates[0].text == "A"
    assert tokens[0].top_candidates[1].text == "B"
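

# Sanity sketch for the session double itself, independent of HTTPClient:
# ``close`` flips the ``closed`` flag, which is what a client shutdown
# path would presumably assert against.
@pytest.mark.asyncio
async def test_mock_session_close_sets_flag():
    session = MockSession({})
    await session.close()
    assert session.closed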