[Inference] Fix bugs and docs for feat/online-server (#5598)

* fix test bugs
* add do sample test
* del useless lines
* fix comments
* fix tests
* delete version tag
* delete version tag
* add
* del test server
* fix test
* fix
* Revert "add"
  This reverts commit b9305fb024.
2025-09-06 11:32:10 +00:00 · 2024-05-08 15:14:06 +08:00
parent 7bbb28e48b
commit 61a1b2e798
12 changed files with 98 additions and 172 deletions
--- a/tests/test_infer/test_async_engine/test_async_engine.py
+++ b/tests/test_infer/test_async_engine/test_async_engine.py
@@ -7,7 +7,7 @@ from colossalai.inference.core.async_engine import AsyncInferenceEngine


@dataclass
-class SequenceTpye:
+class MockSequence:
    request_id: int


@@ -20,7 +20,11 @@ class MockEngine:

    async def async_step(self):
        self.step_calls += 1
-        return [SequenceTpye(request_id=self.request_id)] if self.request_id else []
+        return ([MockSequence(request_id=self.request_id)], True) if self.request_id else ([], False)
+
+    def add_single_request(self, **kwargs):
+        del kwargs
+        self.add_request_calls += 1

    def generate(self, request_id):
        self.request_id = request_id
@@ -37,14 +41,14 @@ class MockEngine:
        self.abort_request_calls += 1


-class MockAsyncLLMEngine(AsyncInferenceEngine):
+class MockAsyncInferenceEngine(AsyncInferenceEngine):
    def _init_engine(self, *args, **kwargs):
        return MockEngine()


@pytest.mark.asyncio
 async def test_new_requests_event():
-    engine = MockAsyncLLMEngine(worker_use_ray=False, engine_use_ray=False)
+    engine = MockAsyncInferenceEngine()
    engine.start_background_loop()
    await asyncio.sleep(0.01)
    assert engine.engine.step_calls == 0
@@ -74,7 +78,3 @@ async def test_new_requests_event():
    await asyncio.sleep(0.01)
    assert engine.engine.add_request_calls == 3
    assert engine.engine.step_calls == 5
-
-
-if __name__ == "__main__":
-    test_new_requests_event()