From 55d037ac4f3c3d12666d94fa213802e7377b43ef Mon Sep 17 00:00:00 2001 From: aries_ckt <916701291@qq.com> Date: Fri, 22 Sep 2023 00:09:57 +0800 Subject: [PATCH] feat:llm manage --- pilot/server/llm_manage/api.py | 36 ---------------------------------- 1 file changed, 36 deletions(-) diff --git a/pilot/server/llm_manage/api.py b/pilot/server/llm_manage/api.py index ad89e8525..605947998 100644 --- a/pilot/server/llm_manage/api.py +++ b/pilot/server/llm_manage/api.py @@ -82,12 +82,6 @@ async def model_stop(request: WorkerStartupRequest): try: from pilot.model.cluster.controller.controller import BaseModelController - # controller = CFG.SYSTEM_APP.get_component( - # ComponentType.MODEL_CONTROLLER, BaseModelController - # ) - # instances = await controller.get_all_instances( - # model_name="WorkerManager@service", healthy_only=True - # ) worker_manager = CFG.SYSTEM_APP.get_component( ComponentType.WORKER_MANAGER_FACTORY, WorkerManagerFactory ).create() @@ -95,17 +89,6 @@ async def model_stop(request: WorkerStartupRequest): return Result.faild(code="E000X", msg=f"can not find worker manager") request.params = {} return Result.succ(await worker_manager.model_shutdown(request)) - # worker_instance = None - # for instance in instances: - # if instance.host == request.host and instance.port == request.port: - # from pilot.model.cluster import ModelRegistryClient - # from pilot.model.cluster import RemoteWorkerManager - # - # registry = ModelRegistryClient(f"http://{request.host}:{request.port}") - # worker_manager = RemoteWorkerManager(registry) - # return Result.succ(await worker_manager.model_shutdown(request)) - # if not worker_instance: - # return Result.faild(code="E000X", msg=f"can not find worker manager") except Exception as e: return Result.faild(code="E000X", msg=f"model stop failed {e}") @@ -114,30 +97,11 @@ async def model_stop(request: WorkerStartupRequest): async def model_start(request: WorkerStartupRequest): print(f"/v1/worker/model/start:") try: - # from pilot.model.cluster.controller.controller import BaseModelController - # - # controller = CFG.SYSTEM_APP.get_component( - # ComponentType.MODEL_CONTROLLER, BaseModelController - # ) - # instances = await controller.get_all_instances( - # model_name="WorkerManager@service", healthy_only=True - # ) worker_manager = CFG.SYSTEM_APP.get_component( ComponentType.WORKER_MANAGER_FACTORY, WorkerManagerFactory ).create() if not worker_manager: return Result.faild(code="E000X", msg=f"can not find worker manager") return Result.succ(await worker_manager.model_startup(request)) - # worker_instance = None - # for instance in instances: - # if instance.host == request.host and instance.port == request.port: - # from pilot.model.cluster import ModelRegistryClient - # from pilot.model.cluster import RemoteWorkerManager - # - # registry = ModelRegistryClient(f"http://{request.host}:{request.port}") - # worker_manager = RemoteWorkerManager(registry) - # return Result.succ(await worker_manager.model_startup(request)) - # if not worker_instance: - # return Result.faild(code="E000X", msg=f"can not find worker manager") except Exception as e: return Result.faild(code="E000X", msg=f"model start failed {e}")