From d0cc6f27b51663ed56bc3abc9b619b4c9c98f32a Mon Sep 17 00:00:00 2001
From: "kyj@bowong.ai"
Date: Thu, 17 Apr 2025 15:40:28 +0800
Subject: [PATCH] =?UTF-8?q?FIX=20AutoDL=E4=BF=AE=E5=A4=8Dexception?=
 =?UTF-8?q?=E5=AF=BC=E8=87=B4worker=E5=81=9C=E6=AD=A2=E9=97=AE=E9=A2=98?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Review notes (this section is ignored when the patch is applied):
- Both worker loops now catch `Exception` instead of using a bare `except:`,
  so KeyboardInterrupt / SystemExit can still terminate the process.
- introspect_instance keeps its `time.sleep(1)` outside the try block, and
  scaling_worker sleeps in its handler, so a persistent failure cannot turn
  either loop into a busy loop that floods the log with tracebacks.
- NOTE(review): the indentation of the context lines was reconstructed from a
  whitespace-collapsed copy of this patch (the two `instance.*` lines in the
  second hunk in particular) - confirm against server.py before applying.
- NOTE(review): the post-image blob hash on the `index` line is carried over
  from the original patch and does not describe the content below.

 AutoDL/autodl_scheduling/server.py | 18 +++++++++++++-----
 1 file changed, 13 insertions(+), 5 deletions(-)

diff --git a/AutoDL/autodl_scheduling/server.py b/AutoDL/autodl_scheduling/server.py
index f7458b4..25975a8 100644
--- a/AutoDL/autodl_scheduling/server.py
+++ b/AutoDL/autodl_scheduling/server.py
@@ -61,13 +61,18 @@ class Server:
     def introspect_instance(self):
         loguru.logger.info("Introspecting worker started || Scaledown Window: %ds" % self.instance_pool.scaledown_window)
         while True:
-            self.instance_pool.introspection()
+            try:
+                self.instance_pool.introspection()
+            except Exception:
+                # Keep the worker alive on errors, but let KeyboardInterrupt/SystemExit propagate.
+                traceback.print_exc()
+            # Sleep outside the try so a failing introspection is still rate-limited.
             time.sleep(1)
 
     def scaling_worker(self):
         loguru.logger.info("Scaling worker started")
-        try:
-            while True:
+        while True:
+            try:
                 # 提交任务
                 self.instance_pool.scale_instance(self.waiting_queue.get_size()+self.running_pool.get_running_size(), disable_shrink=True)
                 for instance in self.instance_pool.instances:
@@ -104,8 +109,11 @@ class Server:
                         instance.active = False
                         instance.last_active_time = time.time()
                 time.sleep(0.5)
-        except:
-            traceback.print_exc()
+            except Exception:
+                # Keep the worker alive on errors, but let KeyboardInterrupt/SystemExit propagate.
+                traceback.print_exc()
+                # Back off after a failure; the sleep above is skipped when the try body raises.
+                time.sleep(0.5)
 
 
 if __name__=="__main__":