xuekailun 4 kuukautta sitten
vanhempi
commit
f31e2b86d6

+ 6 - 0
.gitignore

@@ -0,0 +1,6 @@
+.git
+.idea
+.gitignore
+__pycache__
+__pycache__/*
+README.md

+ 2 - 2
gateway/gateway_config.py

@@ -6,10 +6,10 @@ logging.basicConfig(level=logging.INFO,
                     datefmt='%a, %d %b %Y %H:%M:%S')
 
 # gateway-alb-ecs组-生产环境
-# server_group_id_list = ["sgp-l2k0p33e470vfmj538"]
+server_group_id_list = ["sgp-l2k0p33e470vfmj538"]
 
 # alb后端服务器_调试使用组
-server_group_id_list = ["sgp-ec4gopoclruofsfmxu"]
+# server_group_id_list = ["sgp-ec4gopoclruofsfmxu"]
 
 apps = 'piaoquan-gateway'
 repository = 'registry-vpc.cn-hangzhou.aliyuncs.com/stuuudy/{}'

+ 2 - 3
gateway/gateway_update.py

@@ -66,6 +66,7 @@ def update(instance_id, port):
         checkHealth(ipadd)
         print("%s :权重修改中......" % (ipadd))
         weight_list = [(10, 5), (20, 5), (40, 5), (60, 5), (80, 5), (100, 5)]
+        # weight_list = [(10, 10), (20, 10), (40, 10), (60, 10), (80, 10), (100, 10)]
         utils.update_server_group_servers_attribute(alb_client, gateway_config.server_group_id_list, instance_id_list=[instance_id], weight_list=weight_list, port=port)
         success_count += 1
         print("更新进度" + "%s/%s" % (success_count, total))
@@ -95,13 +96,11 @@ if __name__ == '__main__':
     ecs_client = utils.connect_client(access_key_id=gateway_config.ecs_client_params['access_key_id'],
                                       access_key_secret=gateway_config.ecs_client_params['access_key_secret'],
                                       region_id=gateway_config.ecs_client_params['region_id'])
-    print(f"ecs_client = {ecs_client}")
     # 初始化 ALB 客户端
     alb_client = utils.connect_alb_client(gateway_config.alb_client_params['access_key_id'],
                                           gateway_config.alb_client_params['access_key_secret'],
                                           endpoint=gateway_config.alb_client_params['endpoint']
                                           )
-    print(f"alb_client = {alb_client}")
 
     success_count = 0
     threads = []
@@ -111,8 +110,8 @@ if __name__ == '__main__':
 
     # 获取 ALB 下服务器组的实例 ID
     res = utils.list_server_group_servers(alb_client=alb_client, server_group_id=gateway_config.server_group_id_list[0])
-    print(f"res = {res}")
     total += len(res)
+    print(f"获取 ALB 下服务器组的实例 ID = {res} total = {total}")
     InstanceIDs.extend(res)
     print(InstanceIDs)
 

+ 45 - 19
gateway/utils.py

@@ -370,7 +370,10 @@ def add_servers_to_server_group(alb_client, server_group_id, instance_id, weight
         server_group_id=server_group_id,
         servers=[server]
     )
-    runtime = util_models.RuntimeOptions()
+    runtime = util_models.RuntimeOptions(
+        connect_timeout=5000,
+        read_timeout=60000
+    )
     try:
         alb_client.add_servers_to_server_group_with_options(request, runtime)
         logging.info(f"Successfully added server {instance_id} to server group {server_group_id} with weight {weight}.")
@@ -397,7 +400,10 @@ def remove_servers_from_server_group(alb_client, server_group_id, instance_ids,
             server_group_id=server_group_id,
             servers=[server]
         )
-        runtime = util_models.RuntimeOptions()
+        runtime = util_models.RuntimeOptions(
+            connect_timeout=5000,
+            read_timeout=60000
+        )
         try:
             alb_client.remove_servers_from_server_group_with_options(request, runtime)
             logging.info(f"Successfully removed server {instance_id} from server group {server_group_id}.")
@@ -414,19 +420,29 @@ def list_server_group_servers(alb_client, server_group_id):
     @param server_group_id: 服务器组ID
     @return: 实例ID列表
     """
-    list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-
-    try:
-        response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
-        instance_ids = [server.server_id for server in response.body.servers]
-        return instance_ids
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-        return []
+    instance_ids = []
+    next_token = None
+    while True:
+        try:
+            list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
+                server_group_id=server_group_id,
+                max_results=100,
+                next_token=next_token
+            )
+            runtime = util_models.RuntimeOptions(
+                connect_timeout=5000,
+                read_timeout=60000
+            )
+            response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
+            next_token = UtilClient.to_map(response.body).get('NextToken')
+            sub_instance_ids = [server.server_id for server in response.body.servers]
+            if len(sub_instance_ids) > 0:
+                instance_ids.extend(sub_instance_ids)
+            if next_token is None:
+                break
+        except Exception as error:
+            logging.error(error)
+    return instance_ids
 
 
 async def list_server_group_servers_async(alb_client, server_group_id):
@@ -437,9 +453,13 @@ async def list_server_group_servers_async(alb_client, server_group_id):
     @return: 实例ID列表
     """
     list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
+        server_group_id=server_group_id,
+        max_results=100
+    )
+    runtime = util_models.RuntimeOptions(
+        connect_timeout=5000,
+        read_timeout=60000
     )
-    runtime = util_models.RuntimeOptions()
 
     try:
         response = await alb_client.list_server_group_servers_with_options_async(list_server_group_servers_request, runtime)
@@ -470,7 +490,10 @@ def update_server_group_server_weight(alb_client, server_group_id, instance_id,
         servers=[server],
         server_group_id=server_group_id
     )
-    runtime = util_models.RuntimeOptions()
+    runtime = util_models.RuntimeOptions(
+        connect_timeout=5000,
+        read_timeout=60000
+    )
     try:
         alb_client.update_server_group_servers_attribute_with_options(request, runtime)
         print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight}.")
@@ -515,7 +538,10 @@ async def update_server_group_server_weight_async(alb_client, server_group_id, i
         servers=[server],
         server_group_id=server_group_id
     )
-    runtime = util_models.RuntimeOptions()
+    runtime = util_models.RuntimeOptions(
+        connect_timeout=5000,
+        read_timeout=60000
+    )
     try:
         await alb_client.update_server_group_servers_attribute_with_options_async(request, runtime)
         print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight} asynchronously.")

+ 2 - 4
longvideoapi/longvideoapi_config.py

@@ -5,13 +5,11 @@ logging.basicConfig(level=logging.INFO,
                     format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
                     datefmt='%a, %d %b %Y %H:%M:%S')
 
-slb_id_list = ["lb-bp1qk9mkvjtundlzz7owm", "lb-bp1pj2v06ladvgftgxcp0", "lb-bp1y63rnrb2e64whryghz", "lb-bp17woaq4vz3gnb8ujzvh"]
-
 # longvideoapi-alb-ecs组-生产环境
-# server_group_id_list = ["sgp-h79h3lkvua1xs3418y"]
+server_group_id_list = ["sgp-h79h3lkvua1xs3418y"]
 
 # alb后端服务器_调试使用组
-server_group_id_list = ["sgp-ec4gopoclruofsfmxu"]
+# server_group_id_list = ["sgp-ec4gopoclruofsfmxu"]
 
 
 

+ 3 - 4
longvideoapi/longvideoapi_grayscale_update.py

@@ -101,8 +101,6 @@ def update_instance(ecs_client, alb_client, instance_id, version, port):
     """
     logging.info(f"update instance: {instance_id}")
     # 1. 摘流量,将权重降为0
-    # weight_list = [(0, 20)]  # 设置权重为0,等待20秒
-
     utils.update_server_group_servers_attribute(alb_client=alb_client,
                                                 server_group_id_list=longvideoapi_config.server_group_id_list,
                                                 instance_id_list=[instance_id],
@@ -142,11 +140,12 @@ def update_instance(ecs_client, alb_client, instance_id, version, port):
         sys.exit()
     # 机器探活成功
     time.sleep(20)
-
+    health_instance_ids = [instance_id for instance_id, _ in health_instances]
     add_weight_list = [(10, 5), (20, 5), (40, 5), (60, 5), (80, 5), (100, 5)]
+    # add_weight_list = [(10, 10), (20, 10), (40, 10), (60, 10), (80, 10), (100, 10)]
     utils.update_server_group_servers_attribute(alb_client=alb_client,
                                                 server_group_id_list=longvideoapi_config.server_group_id_list,
-                                                instance_id_list=health_instances,
+                                                instance_id_list=health_instance_ids,
                                                 weight_list=add_weight_list,
                                                 port=port)
     logging.info(f"finished instances: {health_instances}, count: {len(health_instances)}")

+ 53 - 43
longvideoapi/longvideoapi_reduce_with_count.py

@@ -34,48 +34,54 @@ def remove_instances(ecs_client, alb_client, instance_ids, port):
     time.sleep(20)
 
     # 2. 从 ALB 服务器组中移除实例
-    for server_group_id in longvideoapi_config.server_group_id_list:
-        try:
-            utils.remove_servers_from_server_group(alb_client=alb_client, server_group_id=server_group_id,
-                                                   instance_ids=instance_ids, port=port)
-            logging.info(f"Successfully removed instances from server group {server_group_id}.")
-        except Exception as e:
-            logging.error(f"Failed to remove instances from server group {server_group_id}: {e}")
+    # for server_group_id in longvideoapi_config.server_group_id_list:
+    try:
+        utils.remove_servers_from_server_group(alb_client=alb_client,
+                                               server_group_id_list=longvideoapi_config.server_group_id_list,
+                                               instance_ids=instance_ids, port=port)
+        logging.info(
+            f"Successfully removed count:{len(instance_ids)} instance_ids:  {instance_ids} from server group {longvideoapi_config.server_group_id_list}.")
+    except Exception as e:
+        logging.error(
+            f"Failed to remove count:{len(instance_ids)} instance_ids: {instance_ids} from server group {longvideoapi_config.server_group_id_list}: {e}")
 
-    logging.info(f"Remove from ALB finished, instances: {instance_ids}")
+    logging.info(f"Remove from ALB finished, count:{len(instance_ids)} instances: {instance_ids}")
 
     # 3. 停止机器
-    stop_response = utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
-    if stop_response.get('Code') is None:
-        logging.info(f"Instances stop finished, instances: {instance_ids}")
-    else:
-        logging.error(f"Failed to stop instances: {stop_response}")
-        sys.exit()
+    utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
+    # stop_response = utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
+    # if stop_response.get('Code') is None:
+    #     logging.info(f"Instances stop finished, instances: {instance_ids}")
+    # else:
+    #     logging.error(f"Failed to stop instances: {stop_response}")
+    #     sys.exit()
 
     # 4. 判断机器运行状态是否为 Stopped
-    while True:
-        response = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
-        if response.get('Code') is None:
-            instances_list = response.get('InstanceStatuses').get('InstanceStatus')
-            stopped_instances = [instance.get('InstanceId') for instance in instances_list if
-                                 instance.get('Status') == 'Stopped']
-            if len(stopped_instances) == len(instance_ids):
-                logging.info(f"Instances stopped status set success, instances: {stopped_instances}")
-                break
-            else:
-                logging.info(f"Stopped instances count = {len(stopped_instances)}, instances: {stopped_instances}")
-                time.sleep(5)
-        else:
-            logging.error(response)
-            sys.exit()
+    stopped_instances = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
+    # while True:
+    #     response = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
+    #     if response.get('Code') is None:
+    #         instances_list = response.get('InstanceStatuses').get('InstanceStatus')
+    #         stopped_instances = [instance.get('InstanceId') for instance in instances_list if
+    #                              instance.get('Status') == 'Stopped']
+    #         if len(stopped_instances) == len(instance_ids):
+    #             logging.info(f"Instances stopped status set success, instances: {stopped_instances}")
+    #             break
+    #         else:
+    #             logging.info(f"Stopped instances count = {len(stopped_instances)}, instances: {stopped_instances}")
+    #             time.sleep(5)
+    #     else:
+    #         logging.error(response)
+    #         sys.exit()
 
     # 5. 释放机器
-    release_response = utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
-    if release_response.get('Code') is None:
-        logging.info(f"Release instances finished, instances: {stopped_instances}")
-    else:
-        logging.error(f"Release instances fail!!!")
-        sys.exit()
+    utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
+    # release_response = utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
+    # if release_response.get('Code') is None:
+    #     logging.info(f"Release instances finished, instances: {stopped_instances}")
+    # else:
+    #     logging.error(f"Release instances fail!!!")
+    #     sys.exit()
 
 
 def main():
@@ -94,27 +100,31 @@ def main():
 
         # 获取指定释放的机器数量
         reduce_count = int(sys.argv[1])
-        logging.info(f"reduce instances count: {reduce_count}")
+        logging.info(f"reduce_count: {reduce_count}")
 
         # 获取 ALB 下所有机器
-        online_instance_ids = utils.list_server_group_servers(alb_client=alb_client, server_group_id=longvideoapi_config.server_group_id_list[0])
+        online_instance_ids = utils.list_server_group_servers(alb_client=alb_client,
+                                                              server_group_id=longvideoapi_config.server_group_id_list[
+                                                                  0])
         online_instance_count = len(online_instance_ids)
-        logging.info(f"online instance count: {online_instance_count}.")
-        logging.info(f"online instance ids: {online_instance_ids}")
+        logging.info(f"online instance count: {online_instance_count} instance_ids: {online_instance_ids}")
+
+        if online_instance_count - reduce_count < 10:
+            logging.error("缩容后服务器数量不能小于10台")
+            sys.exit()
 
         # 获取前 count 台机器进行释放
         reduce_instance_ids = online_instance_ids[:reduce_count]
-        logging.info(f"reduce instances: {reduce_instance_ids}")
+        logging.info(f"reduce instances count = {len(reduce_instance_ids)} instances: {reduce_instance_ids}")
 
         # 停止并释放机器
-        remove_instances(ecs_client=ecs_client, alb_client=alb_client, instance_ids=reduce_instance_ids, port=longvideoapi_config.port)
+        remove_instances(ecs_client=ecs_client, alb_client=alb_client, instance_ids=reduce_instance_ids,
+                         port=longvideoapi_config.port)
         logging.info(f"stop & release instances end!")
     except Exception as e:
         logging.error(e)
         sys.exit()
 
 
-
 if __name__ == '__main__':
     main()
-

+ 1 - 0
longvideoapi/longvideoapi_restart.py

@@ -37,6 +37,7 @@ def server_restart(alb_client, ecs_client, instance_id, image_name, port):
 
         # 设置权重
         add_weight_list = [(10, 5), (20, 5), (40, 5), (60, 5), (80, 5), (100, 5)]
+        # add_weight_list = [(10, 10), (20, 10), (40, 10), (60, 10), (80, 10), (100, 10)]
         utils.update_server_group_servers_attribute(alb_client=alb_client,
                                                     server_group_id_list=longvideoapi_config.server_group_id_list,
                                                     instance_id_list=[instance_id],

+ 8 - 5
longvideoapi/longvideoapi_scaling_k_count.py

@@ -65,7 +65,7 @@ async def ess_instance(ecs_client, alb_client, ess_count, max_workers, port):
 
     # 2. 发送启动脚本到机器上
     utils.send_file_to_ecs(ecs_client=ecs_client, instance_id_list=ess_instance_ids, **longvideoapi_config.start_sh)
-    logging.info(f"send start shell file finished, instances: {ess_instance_ids}")
+    logging.info(f"send start shell file finished, count: {len(ess_instance_ids)} instances: {ess_instance_ids}")
     # 3. 启动服务
     start_sh_param = "latest"
     server_start_sh = os.path.join(longvideoapi_config.start_sh['target_dir'], longvideoapi_config.start_sh['name'])
@@ -74,7 +74,7 @@ async def ess_instance(ecs_client, alb_client, ess_count, max_workers, port):
     # 4. 异步探活
     global health_instances
     health_instances = []
-    max_wait_time = 180
+    max_wait_time = 360
     loop = asyncio.get_running_loop()
     executor = ThreadPoolExecutor(max_workers=max_workers)
     tasks = [
@@ -88,9 +88,12 @@ async def ess_instance(ecs_client, alb_client, ess_count, max_workers, port):
     if len(health_instances) > 0:
         # 所有机器探活成功
         time.sleep(20)
-        for instance_id, ip in health_instances:
-            for server_group_id in longvideoapi_config.server_group_id_list:
-                utils.add_servers_to_server_group(alb_client, server_group_id, instance_id, weight=100, port=port)
+        # instance_id_list = []
+        # for instance_id, ip in health_instances:
+        #     instance_id_list.append(instance_id)
+        # #     for server_group_id in longvideoapi_config.server_group_id_list:
+        health_instance_ids = [instance_id for instance_id, _ in health_instances]
+        utils.add_servers_to_server_group(alb_client, longvideoapi_config.server_group_id_list, health_instance_ids, weight=100, port=port)
         logging.info(f"ess count: {ess_count}, "
                      f"create count: {len(ess_instance_ids)}, "
                      f"finished count: {len(health_instances)}")

+ 31 - 0
longvideoapi/longvideoapi_unittest.py

@@ -0,0 +1,31 @@
+import logging
+import unittest
+
+from longvideoapi import utils, longvideoapi_config
+
+
+class MyTestCase(unittest.TestCase):
+    def test_list_server_group_servers(self):
+        alb_client = utils.connect_alb_client(
+            access_key_id=longvideoapi_config.alb_client_params['access_key_id'],
+            access_key_secret=longvideoapi_config.alb_client_params['access_key_secret'],
+            endpoint=longvideoapi_config.alb_client_params['endpoint']
+        )
+
+        instance_ids = utils.list_server_group_servers(alb_client, longvideoapi_config.server_group_id_list[0])
+        logging.info(instance_ids)
+
+    def test_create_multiple_instances(self):
+        ecs_client = utils.connect_client(access_key_id=longvideoapi_config.ecs_client_params['access_key_id'],
+                                          access_key_secret=longvideoapi_config.ecs_client_params['access_key_secret'],
+                                          region_id=longvideoapi_config.ecs_client_params['region_id'])
+        ess_instance_ids = utils.create_multiple_instances(
+            amount=120,
+            ecs_client=ecs_client,
+            **longvideoapi_config.instance_config_k,
+        )
+        logging.info(ess_instance_ids)
+
+
+if __name__ == '__main__':
+    unittest.main()

+ 52 - 45
longvideoapi/longvideoapi_update_k.py

@@ -61,11 +61,12 @@ async def ess_instance(ecs_client, alb_client, ess_count, max_workers, version,
 
     # 2. 发送启动脚本到机器上
     utils.send_file_to_ecs(ecs_client=ecs_client, instance_id_list=ess_instance_ids, **longvideoapi_config.start_sh)
-    logging.info(f"send start shell file finished, instances: {ess_instance_ids}")
+    logging.info(f"send start shell file finished, count: {len(ess_instance_ids)} instances: {ess_instance_ids}")
     # 3. 启动服务
     server_start_sh = os.path.join(longvideoapi_config.start_sh['target_dir'], longvideoapi_config.start_sh['name'])
     server_start_commend = f"sh {server_start_sh} {version}"
     utils.run_command(ecs_client=ecs_client, instance_ids=ess_instance_ids, command=server_start_commend)
+    logging.info(f"start server finish, count: {len(ess_instance_ids)} instances: {ess_instance_ids}")
     # 4. 异步探活
     global health_instances
     health_instances = []
@@ -76,18 +77,21 @@ async def ess_instance(ecs_client, alb_client, ess_count, max_workers, version,
         [(ecs_client, instance_id) for instance_id in ess_instance_ids]
     ]
     await asyncio.wait(tasks)
-    logging.info(f"health instances count: {len(health_instances)}, {health_instances}")
+    logging.info(f"health instances count: {len(health_instances)}, instances: {health_instances}")
     # 5. 挂载流量
     if len(health_instances) == len(ess_instance_ids):
         # 所有机器探活成功
         time.sleep(20)
         health_instance_ids = [instance_id for instance_id, _ in health_instances]
-        for server_group_id in longvideoapi_config.server_group_id_list:
-            for instance_id in health_instance_ids:
-                utils.add_servers_to_server_group(alb_client, server_group_id, instance_id, weight=0, port=port)
-                logging.info(f"Successfully added instance {instance_id} to server group {server_group_id}.")
+        # for server_group_id in longvideoapi_config.server_group_id_list:
+            # for instance_id in health_instance_ids:
+        utils.add_servers_to_server_group(alb_client, longvideoapi_config.server_group_id_list, health_instance_ids, weight=0, port=port)
+        logging.info(f"Successfully added count: {len(health_instance_ids)} health_instance_ids {health_instance_ids} to server groups {longvideoapi_config.server_group_id_list}.")
 
+        time.sleep(20)
+        logging.info(f"start update weight count: {len(health_instance_ids)} instances: {health_instance_ids} server groups: {longvideoapi_config.server_group_id_list}.")
         add_weight_list = [(10, 5), (20, 5), (40, 5), (60, 5), (80, 5), (100, 5)]
+        # add_weight_list = [(10, 10), (20, 10), (40, 10), (60, 10), (80, 10), (100, 10)]
         utils.update_server_group_servers_attribute(alb_client,
                                                     server_group_id_list=longvideoapi_config.server_group_id_list,
                                                     instance_id_list=health_instance_ids,
@@ -168,8 +172,8 @@ async def update_instance(ecs_client, alb_client, instance_ids, max_workers, ver
     :param port: 后端服务器使用的端口
     :return:
     """
-    media_index = len(instance_ids)//2
-    instance_ids_group = [instance_ids[:media_index], instance_ids[media_index:]]
+    sub_index = len(instance_ids)//2
+    instance_ids_group = [instance_ids[:sub_index], instance_ids[sub_index:]]
     update_finished_count = 0
     for instance_id_list in instance_ids_group:
         logging.info(f"update instances: {instance_id_list}")
@@ -179,7 +183,7 @@ async def update_instance(ecs_client, alb_client, instance_ids, max_workers, ver
                                                     instance_id_list=instance_id_list,
                                                     weight_list=[(0, 20)],
                                                     port=port)
-        logging.info(f"set weight with 0 finished, instances: {instance_id_list}")
+        logging.info(f"set weight with 0 finished, count: {len(instance_id_list)} instances: {instance_id_list}")
         # 2. 异步移除旧容器并删除旧镜像
         global remove_container_instances
         remove_container_instances = []
@@ -223,6 +227,7 @@ async def update_instance(ecs_client, alb_client, instance_ids, max_workers, ver
             health_instance_ids = [instance_id for instance_id, _ in health_instances]
 
             add_weight_list = [(10, 5), (20, 5), (40, 5), (60, 5), (80, 5), (100, 5)]
+            # add_weight_list = [(10, 10), (20, 10), (40, 10), (60, 10), (80, 10), (100, 10)]
             utils.update_server_group_servers_attribute(alb_client,
                                                         server_group_id_list=longvideoapi_config.server_group_id_list,
                                                         instance_id_list=health_instance_ids,
@@ -259,47 +264,50 @@ def remove_instances(ecs_client, alb_client, instance_ids, port):
 
     time.sleep(10)
     # 2.移除alb
-    for server_group_id in longvideoapi_config.server_group_id_list:
-        try:
-            utils.remove_servers_from_server_group(alb_client=alb_client, server_group_id=server_group_id,
-                                                   instance_ids=instance_ids, port=port)
-            logging.info(f"Successfully removed instances from server group {server_group_id}.")
-        except Exception as e:
-            logging.error(f"Failed to remove instances from server group {server_group_id}: {e}")
+    # for server_group_id in longvideoapi_config.server_group_id_list:
+    try:
+        utils.remove_servers_from_server_group(alb_client=alb_client, server_group_id_list=longvideoapi_config.server_group_id_list,
+                                               instance_ids=instance_ids, port=port)
+        logging.info(f"Successfully removed instances: {instance_ids} from server group {longvideoapi_config.server_group_id_list}.")
+    except Exception as e:
+        logging.error(f"Failed to remove instances: {instance_ids} from server group {longvideoapi_config.server_group_id_list}: {e}")
 
     logging.info(f"Remove from ALB finished, instances: {instance_ids}")
 
     # 3. 停止机器
-    stop_response = utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
-    if stop_response.get('Code') is None:
-        logging.info(f"Instances stop finished, instances: {instance_ids}")
-    else:
-        logging.error(f"Failed to stop instances: {stop_response}")
-        sys.exit()
+    utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
+    # stop_response = utils.stop_instances(ecs_client=ecs_client, instance_ids=instance_ids)
+    # if stop_response.get('Code') is None:
+    #     logging.info(f"Instances stop finished, instances: {instance_ids}")
+    # else:
+    #     logging.error(f"Failed to stop instances: {stop_response}")
+    #     sys.exit()
 
     # 4. 判断机器运行状态是否为Stopped
-    while True:
-        response = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
-        if response.get('Code') is None:
-            instances_list = response.get('InstanceStatuses').get('InstanceStatus')
-            stopped_instances = [instance.get('InstanceId') for instance in instances_list if
-                                 instance.get('Status') == 'Stopped']
-            if len(stopped_instances) == len(instance_ids):
-                logging.info(f"Instances stopped status set success, instances: {stopped_instances}")
-                break
-            else:
-                logging.info(f"Stopped instances count = {len(stopped_instances)}, instances: {stopped_instances}")
-                time.sleep(5)
-        else:
-            logging.error(response)
-            sys.exit()
+    # while True:
+    stopped_instances = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
+        # response = utils.get_instances_status(ecs_client=ecs_client, instance_ids=instance_ids)
+        # if response.get('Code') is None:
+        #     instances_list = response.get('InstanceStatuses').get('InstanceStatus')
+        #     stopped_instances = [instance.get('InstanceId') for instance in instances_list if
+        #                          instance.get('Status') == 'Stopped']
+        #     if len(stopped_instances) == len(instance_ids):
+        #         logging.info(f"Instances stopped status set success, instances: {stopped_instances}")
+        #         break
+        #     else:
+        #         logging.info(f"Stopped instances count = {len(stopped_instances)}, instances: {stopped_instances}")
+        #         time.sleep(5)
+        # else:
+        #     logging.error(response)
+        #     sys.exit()
     # 5. 释放机器
-    release_response = utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
-    if release_response.get('Code') is None:
-        logging.info(f"Release instances finished, instances: {stopped_instances}")
-    else:
-        logging.error(f"Release instances fail!!!")
-        sys.exit()
+    utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
+    # release_response = utils.release_instances(ecs_client=ecs_client, instance_ids=stopped_instances)
+    # if release_response.get('Code') is None:
+    #     logging.info(f"Release instances finished, instances: {stopped_instances}")
+    # else:
+    #     logging.error(f"Release instances fail!!!")
+    #     sys.exit()
 
 
 def main():
@@ -317,8 +325,7 @@ def main():
         # 1. 获取alb下所有机器
         online_instance_ids = utils.list_server_group_servers(alb_client=alb_client, server_group_id=longvideoapi_config.server_group_id_list[0])
         online_instance_count = len(online_instance_ids)
-        logging.info(f"online instance count: {online_instance_count}.")
-        logging.info(f"online instance ids: {online_instance_ids}")
+        logging.info(f"online instance count: {online_instance_count} instance_ids: {online_instance_ids}")
 
         # 2. 扩容机器并启动新服务 扩容数量:线上机器数量//2
         logging.info(f"ess instances start ...")

+ 257 - 204
longvideoapi/utils.py

@@ -24,7 +24,7 @@ from alibabacloud_tea_openapi import models as open_api_models
 from alibabacloud_alb20200616 import models as alb_models
 from alibabacloud_alb20200616 import models as alb_20200616_models
 from alibabacloud_tea_util import models as util_models
-
+from urllib3 import request
 
 logging.basicConfig(level=logging.INFO,
                     format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
@@ -77,9 +77,6 @@ def connect_alb_client(access_key_id, access_key_secret, endpoint):
     return alb_client
 
 
-
-
-
 def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
                                    disk_size, disk_category, key_pair_name, tags):
     """
@@ -119,16 +116,16 @@ def send_req(client, request):
     """
     request.set_accept_format('json')
     response = client.do_action_with_exception(request)
-    #print(response)
+    # print(response)
     response = json.loads(response)
     print(response)
-        # logging.info(response)
+    # logging.info(response)
     print(response.get('Code'))
     return response
-    #except Exception as e:
-        # 失败,记录报错信息,发送通知,停止并退出
-    #logging.error(e)
-    #sys.exit()
+    # except Exception as e:
+    # 失败,记录报错信息,发送通知,停止并退出
+    # logging.error(e)
+    # sys.exit()
 
 
 def check_instance_running(ecs_client, instance_ids):
@@ -177,7 +174,6 @@ def get_ip_address(ecs_client, instance_id):
     return ip_address
 
 
-
 def create_multiple_instances(amount, ecs_client,
                               image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
                               disk_size, disk_category, key_pair_name, tags):
@@ -203,29 +199,42 @@ def create_multiple_instances(amount, ecs_client,
     #     access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
     # )
     # 2. 请求参数配置
-    request = build_create_instances_request(
-        image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
-        instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
-        key_pair_name=key_pair_name, tags=tags
-    )
-    request.set_Amount(amount)
-    # 3. 发送API请求,购买机器并启动
-    response = send_request(ecs_client=ecs_client, request=request)
-    if response.get('Code') is None:
-        instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
-        logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
-        # 获取机器运行状态
-        running_amount = 0
-        while running_amount < amount:
-            time.sleep(10)
-            running_amount, running_instances = check_instance_running(ecs_client=ecs_client, instance_ids=instance_ids)
-            logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
-        return instance_ids
-    else:
-        # 失败,记录报错信息,发送通知,停止并退出
-        logging.error(response)
-        sys.exit()
-
+    instance_ids = []
+    remain = amount
+    while True:
+        if remain <= 0:
+            break
+        if remain > 50:
+            sub_amount = 50
+            remain = remain - sub_amount
+        else:
+            sub_amount = remain
+            remain = 0
+        request = build_create_instances_request(
+            image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
+            instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
+            key_pair_name=key_pair_name, tags=tags
+        )
+        request.set_Amount(sub_amount)
+        # 3. 发送API请求,购买机器并启动
+        response = send_request(ecs_client=ecs_client, request=request)
+        if response.get('Code') is None:
+            sub_instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
+            logging.info(f"success amount: {len(sub_instance_ids)}, instance ids: {sub_instance_ids}.")
+            # 获取机器运行状态
+            running_amount = 0
+            while running_amount < sub_amount:
+                time.sleep(20)
+                running_amount, running_instances = check_instance_running(ecs_client=ecs_client,
+                                                                           instance_ids=sub_instance_ids)
+                logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
+            # return instance_ids
+            instance_ids.extend(sub_instance_ids)
+        else:
+            # 失败,记录报错信息,发送通知,停止并退出
+            logging.error(response)
+            sys.exit()
+    return instance_ids
 
 
 def release_instances(ecs_client, instance_ids, force=False):
@@ -236,12 +245,19 @@ def release_instances(ecs_client, instance_ids, force=False):
     :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
     :return:
     """
-    request = DeleteInstancesRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_Force(force)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
+    instance_id_list_array = [instance_ids[i:i + 100] for i in range(0, len(instance_ids), 100)]
+    for instance_id_sub_array in instance_id_list_array:
+        request = DeleteInstancesRequest()
+        request.set_InstanceIds(instance_id_sub_array)
+        request.set_Force(force)
+        response = send_request(ecs_client=ecs_client, request=request)
+        # return response
+        if response.get('Code') is None:
+            logging.info(f"Release instances finished, count = {len(instance_id_sub_array)} instances: {instance_id_sub_array}")
+        else:
+            logging.error(f"Release instances fail!!!")
+            sys.exit()
+        time.sleep(3)
 
 
 def get_instances_status(ecs_client, instance_ids):
@@ -251,13 +267,31 @@ def get_instances_status(ecs_client, instance_ids):
     :param instance_ids: instance_id, type-list
     :return:
     """
-    request = DescribeInstanceStatusRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_PageSize(50)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
-
+    stopped_instances = []
+    instance_id_list_array = [instance_ids[i:i + 50] for i in range(0, len(instance_ids), 50)]
+    for instance_id_sub_array in instance_id_list_array:
+        while True:
+            request = DescribeInstanceStatusRequest()
+            request.set_InstanceIds(instance_id_sub_array)
+            request.set_PageSize(50)
+            response = send_request(ecs_client=ecs_client, request=request)
+            # return response
+            if response.get('Code') is None:
+                instances_list = response.get('InstanceStatuses').get('InstanceStatus')
+                stopped_instances_sub = [instance.get('InstanceId') for instance in instances_list if
+                                     instance.get('Status') == 'Stopped']
+                if len(stopped_instances_sub) == len(instance_id_sub_array):
+                    logging.info(f"Instances stopped status set success, count:{len(stopped_instances_sub)} instances: {stopped_instances_sub}")
+                    stopped_instances.extend(stopped_instances_sub)
+                    break
+                else:
+                    logging.info(f"Stopped instances count = {len(stopped_instances_sub)}, instances: {stopped_instances_sub}")
+                    time.sleep(5)
+            else:
+                logging.error(response)
+                sys.exit()
+            time.sleep(3)
+    return stopped_instances
 
 def stop_instances(ecs_client, instance_ids, force_stop=False):
     """
@@ -267,13 +301,19 @@ def stop_instances(ecs_client, instance_ids, force_stop=False):
     :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
     :return:
     """
-    request = StopInstancesRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_ForceStop(force_stop)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
-
+    instance_id_list_array = [instance_ids[i:i + 100] for i in range(0, len(instance_ids), 100)]
+    for instance_id_sub_array in instance_id_list_array:
+        request = StopInstancesRequest()
+        request.set_InstanceIds(instance_id_sub_array)
+        request.set_ForceStop(force_stop)
+        response = send_request(ecs_client=ecs_client, request=request)
+        # return response
+        if response.get('Code') is None:
+            logging.info(f"Instances stop finished, count:{len(instance_id_sub_array)} instances: {instance_id_sub_array}")
+        else:
+            logging.error(f"Failed to stop instances: {response}")
+            sys.exit()
+        time.sleep(3)
 
 
 def send_request(ecs_client, request):
@@ -295,7 +335,6 @@ def send_request(ecs_client, request):
         sys.exit()
 
 
-
 def run_command(ecs_client, instance_ids, command):
     """
     批量执行命令
@@ -313,8 +352,9 @@ def run_command(ecs_client, instance_ids, command):
         request.set_Type("RunShellScript")
         request.set_CommandContent(command)
         request.set_InstanceIds(instance_id_list)
+        request.set_Timeout(180)
         response = send_request(ecs_client=ecs_client, request=request)
-        logging.info(response)
+        logging.info(f"run_command count:{len(instance_id_list)} instance_id_list:{instance_id_list} response:{response}")
 
 
 def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
@@ -350,61 +390,85 @@ def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
             logging.error(f"发送文件到实例 {instance_ids} 失败,错误: {str(e)}")
 
 
-
-def add_servers_to_server_group(alb_client, server_group_id, instance_id, weight, port):
+def add_servers_to_server_group(alb_client, server_group_ids, instance_ids, weight, port):
     """
     添加服务器到ALB服务器组
     :param alb_client: ALB客户端连接
-    :param server_group_id: 服务器组ID
-    :param instance_id: 实例ID
+    :param server_group_ids: 服务器组ID
+    :param instance_ids: 实例ID
     :param weight: 权重
     :param port: 后端服务器使用的端口
     """
-    server = alb_models.AddServersToServerGroupRequestServers(
-        server_id=instance_id,
-        server_type='ecs',
-        weight=weight,
-        port=port
-    )
-    request = alb_models.AddServersToServerGroupRequest(
-        server_group_id=server_group_id,
-        servers=[server]
-    )
-    runtime = util_models.RuntimeOptions()
-    try:
-        alb_client.add_servers_to_server_group_with_options(request, runtime)
-        logging.info(f"Successfully added server {instance_id} to server group {server_group_id} with weight {weight}.")
-    except Exception as e:
-        logging.error(f"Failed to add server {instance_id} to server group {server_group_id}: {str(e)}")
-
-
-
-def remove_servers_from_server_group(alb_client, server_group_id, instance_ids, port):
+    instance_ids_array = [instance_ids[i:i + 200] for i in range(0, len(instance_ids), 200)]
+    for instance_ids_sub_array in instance_ids_array:
+        servers = []
+        for i in range(len(instance_ids_sub_array)):
+            server = alb_models.AddServersToServerGroupRequestServers(
+                server_id=instance_ids_sub_array[i],
+                server_type='ecs',
+                weight=weight,
+                port=port
+            )
+            servers.append(server)
+
+        # server = alb_models.AddServersToServerGroupRequestServers(
+        #     server_id=instance_id,
+        #     server_type='ecs',
+        #     weight=weight,
+        #     port=port
+        # )
+        for server_group_id in server_group_ids:
+            request = alb_models.AddServersToServerGroupRequest(
+                server_group_id=server_group_id,
+                servers=servers
+            )
+            runtime = util_models.RuntimeOptions(
+                connect_timeout=5000,
+                read_timeout=60000
+            )
+            try:
+                alb_client.add_servers_to_server_group_with_options(request, runtime)
+                logging.info(
+                    f"Successfully added count:{len(instance_ids_sub_array)} instance_ids: {instance_ids_sub_array} to server group {server_group_id} with weight {weight}.")
+            except Exception as e:
+                logging.error(f"Failed to add count:{len(instance_ids_sub_array)} instance_ids: {instance_ids_sub_array} to server group {server_group_id}: {str(e)}")
+                sys.exit()
+        time.sleep(5)
+
+def remove_servers_from_server_group(alb_client, server_group_id_list, instance_ids, port):
     """
     从ALB服务器组中移除服务器
     :param alb_client: ALB客户端连接
-    :param server_group_id: 服务器组ID
-    :param instance_ids: 实例ID
+    :param server_group_id_list: 服务器组ID list
+    :param instance_ids: 实例ID list
     :param port: 后端服务器使用的端口
     """
-    for instance_id in instance_ids:
-        server = alb_models.RemoveServersFromServerGroupRequestServers(
-            port=port,
-            server_id=instance_id,
-            server_type='ecs'
-        )
-        request = alb_models.RemoveServersFromServerGroupRequest(
-            server_group_id=server_group_id,
-            servers=[server]
-        )
-        runtime = util_models.RuntimeOptions()
-        try:
-            alb_client.remove_servers_from_server_group_with_options(request, runtime)
-            logging.info(f"Successfully removed server {instance_id} from server group {server_group_id}.")
-        except Exception as e:
-            logging.error(f"Failed to remove server {instance_id} from server group {server_group_id}: {str(e)}")
-
-
+    instance_ids_array = [instance_ids[i:i + 200] for i in range(0, len(instance_ids), 200)]
+    for instance_ids_sub_array in instance_ids_array:
+        servers = []
+        for instance_id in instance_ids_sub_array:
+            server = alb_models.RemoveServersFromServerGroupRequestServers(
+                port=port,
+                server_id=instance_id,
+                server_type='ecs'
+            )
+            servers.append(server)
+        for server_group_id in server_group_id_list:
+            request = alb_models.RemoveServersFromServerGroupRequest(
+                server_group_id=server_group_id,
+                servers=servers
+            )
+            runtime = util_models.RuntimeOptions(
+                connect_timeout=5000,
+                read_timeout=60000
+            )
+            try:
+                alb_client.remove_servers_from_server_group_with_options(request, runtime)
+                logging.info(f"Successfully removed count: {len(instance_ids_sub_array)} instance_ids: {instance_ids_sub_array} from server group {server_group_id}.")
+            except Exception as e:
+                logging.error(f"Failed to remove count: {len(instance_ids_sub_array)} instance_ids: {instance_ids_sub_array} from server group {server_group_id}: {str(e)}")
+                sys.exit()
+        time.sleep(5)
 
 
 def list_server_group_servers(alb_client, server_group_id):
@@ -414,69 +478,72 @@ def list_server_group_servers(alb_client, server_group_id):
     @param server_group_id: 服务器组ID
     @return: 实例ID列表
     """
-    list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-
-    try:
-        response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
-        instance_ids = [server.server_id for server in response.body.servers]
-        return instance_ids
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-        return []
-
-
-async def list_server_group_servers_async(alb_client, server_group_id):
-    """
-    异步列出指定服务器组中的服务器并返回实例ID列表
-    @param alb_client: ALB客户端
-    @param server_group_id: 服务器组ID
-    @return: 实例ID列表
-    """
-    list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-
-    try:
-        response = await alb_client.list_server_group_servers_with_options_async(list_server_group_servers_request, runtime)
-        instance_ids = [server.server_id for server in response.body.servers]
-        return instance_ids
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-        return []
-
-
-def update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port):
+    instance_ids = []
+    next_token = None
+    while True:
+        try:
+            list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
+                server_group_id=server_group_id,
+                max_results=100,
+                next_token=next_token
+            )
+            runtime = util_models.RuntimeOptions(
+                connect_timeout=5000,
+                read_timeout=60000
+            )
+            response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
+            next_token = UtilClient.to_map(response.body).get('NextToken')
+            sub_instance_ids = [server.server_id for server in response.body.servers]
+            if len(sub_instance_ids) > 0:
+                instance_ids.extend(sub_instance_ids)
+            if next_token is None:
+                break
+        except Exception as error:
+            logging.error(error)
+        time.sleep(3)
+    return instance_ids
+
+
+def update_server_group_server_weight(alb_client, server_group_id_list, instance_id_list, weight, port):
     """
     更指定服务器在服务器组中的权重
     :param alb_client: ALB客户端
-    :param server_group_id: 服务器组ID
-    :param instance_id: 实例ID
+    :param server_group_id_list: 服务器组ID list
+    :param instance_id_list: 实例ID list
     :param weight: 权重值
     :param port: 后端服务器使用的端口
     """
-    server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
-        server_type='Ecs',
-        server_id=instance_id,
-        weight=weight,
-        port=port
-    )
-    request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
-        servers=[server],
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-    try:
-        alb_client.update_server_group_servers_attribute_with_options(request, runtime)
-        print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight}.")
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
+    instance_id_list_array = [instance_id_list[i:i + 40] for i in range(0, len(instance_id_list), 40)]
+    for instance_ids_sub_array in instance_id_list_array:
+        servers = []
+        for i in range(len(instance_ids_sub_array)):
+            server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
+                server_type='Ecs',
+                server_id=instance_ids_sub_array[i],
+                weight=weight,
+                port=port
+            )
+            servers.append(server)
+        for server_group_id in server_group_id_list:
+            request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
+                servers=servers,
+                server_group_id=server_group_id
+            )
+            # logging.info(f"servers = {servers}")
+            runtime = util_models.RuntimeOptions(
+                connect_timeout=5000,
+                read_timeout=60000
+            )
+            try:
+                # logging.info(f"instance_id_list = {instance_id_list} request = {request}")
+                alb_client.update_server_group_servers_attribute_with_options(request, runtime)
+                logging.info(
+                    f"Successfully updated count = {len(instance_ids_sub_array)} instance_ids: {instance_ids_sub_array} in group {server_group_id} to weight {weight}.")
+            except Exception as e:
+                logging.error(e)
+                sys.exit()
+        time.sleep(5)
+
 
 def update_server_group_servers_attribute(alb_client, server_group_id_list, instance_id_list, weight_list, port):
     """
@@ -487,54 +554,40 @@ def update_server_group_servers_attribute(alb_client, server_group_id_list, inst
     :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
     :param port: 后端服务器使用的端口
     """
-    for server_group_id in server_group_id_list:
-        for instance_id in instance_id_list:
-            for weight, sleep_time in weight_list:
-                update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port)
-                time.sleep(sleep_time)
+    # for server_group_id in server_group_id_list:
+    #     for instance_id in instance_id_list:
+    for weight, sleep_time in weight_list:
+        update_server_group_server_weight(alb_client, server_group_id_list, instance_id_list, weight, port)
+        time.sleep(sleep_time)
+        # check_server_group_status(alb_client, server_group_id_list)
 
 
-
-
-async def update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port):
-    """
-    异步更新特定服务器在服务器组中的权重
-    :param alb_client: ALB客户端
-    :param server_group_id: 服务器组ID
-    :param instance_id: 实例ID
-    :param weight: 权重值
-    :param port: 后端服务器使用的端口
-    """
-    server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
-        server_type='Ecs',
-        server_id=instance_id,
-        weight=weight,
-        port=port
+def check_server_group_status(alb_client, server_group_id_list):
+    list_server_groups_request = alb_20200616_models.ListServerGroupsRequest(
+        server_group_ids=server_group_id_list,
+        max_results=100
     )
-    request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
-        servers=[server],
-        server_group_id=server_group_id
+    flag = False
+    runtime = util_models.RuntimeOptions(
+        connect_timeout=5000,
+        read_timeout=60000
     )
-    runtime = util_models.RuntimeOptions()
-    try:
-        await alb_client.update_server_group_servers_attribute_with_options_async(request, runtime)
-        print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight} asynchronously.")
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-
-async def update_server_group_servers_attribute_async(alb_client, server_group_id_list, instance_ids, weight_list, port):
-    """
-    异步更新服务器组中的服务器属性
-    :param alb_client: ALB客户端
-    :param server_group_id_list: 服务器组ID列表
-    :param instance_ids: 实例ID列表
-    :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
-    """
-    tasks = []
-    for server_group_id in server_group_id_list:
-        for instance_id in instance_ids:
-            for weight, sleep_time in weight_list:
-                tasks.append(update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port))
-                await asyncio.sleep(sleep_time)
-    await asyncio.gather(*tasks)
+    for i in range(10):
+        try:
+            response = alb_client.list_server_groups_with_options(list_server_groups_request, runtime)
+            count = 0
+            if response.body:
+                server_groups = UtilClient.to_map(response.body).get("ServerGroups")
+                if server_groups:
+                    for server_group in server_groups:
+                        if server_group.get("ServerGroupStatus") == "Available":
+                            logging.info(f"Server group {server_group} is available.")
+                            count += 1
+            if count == len(server_group_id_list):
+                flag = True
+                break
+            time.sleep(2)
+        except Exception as e:
+            logging.error(e)
+    if not flag:
+        sys.exit()

+ 0 - 0
test/__init__.py


+ 0 - 96
test/albtest.py

@@ -1,96 +0,0 @@
-import unittest
-import sys
-import logging
-from util import utils
-from aliyunsdkcore.client import AcsClient
-from alibabacloud_alb20200616.client import Client as Alb20200616Client
-from alibabacloud_tea_openapi import models as open_api_models
-
-# 配置客户端参数
-alb_client_params = {
-    'access_key_id': 'LTAI5tASD5yEZLeC8ffmNebY',
-    'access_key_secret': '1PtsFRdp8viJmI78lEhNZR8MezWZBq',
-    # 'endpoint': 'alb-vpc.cn-hangzhou.aliyuncs.com',
-    'endpoint': 'alb.cn-hangzhou.aliyuncs.com',    #  外网调试
-    'region_id': 'cn-hangzhou'
-}
-
-ecs_client_params = {
-    'access_key_id': 'LTAI4GBWbFvvXoXsSVBe1o9f',
-    'access_key_secret': 'kRAikWitb4kDxaAyBqNrmLmllMEDO3',
-    'region_id': 'cn-hangzhou'
-}
-
-server_group_id = "sgp-ec4gopoclruofsfmxu"  # 测试用的服务器组
-instance_id = "i-bp19n839usecekzn2ig9"  # PaddlePaddle_k8s集群登陆实例,不影响线上服务
-
-
-def connect_client(access_key_id, access_key_secret, region_id):
-    try:
-        clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
-        return clt
-    except Exception as e:
-        logging.error(e)
-        sys.exit()
-
-def connect_alb_client(access_key_id, access_key_secret, endpoint):
-    config = open_api_models.Config(
-        access_key_id=access_key_id,
-        access_key_secret=access_key_secret,
-        endpoint=endpoint
-    )
-    alb_client = Alb20200616Client(config)
-    return alb_client
-
-class MyTestCase(unittest.TestCase):
-    ecs_client = connect_client(
-        access_key_id=ecs_client_params['access_key_id'],
-        access_key_secret=ecs_client_params['access_key_secret'],
-        region_id=ecs_client_params['region_id']
-    )
-    alb_client = connect_alb_client(
-        access_key_id=alb_client_params['access_key_id'],
-        access_key_secret=alb_client_params['access_key_secret'],
-        endpoint=alb_client_params['endpoint']
-    )
-
-
-    def test_add_servers_to_server_group(self):
-        weight=0
-        server_group_id = "sgp-ec4gopoclruofsfmxu"
-        instance_id = "i-bp19n839usecekzn2ig9"
-        utils.add_servers_to_server_group(self.alb_client, server_group_id, instance_id, weight, port=80)
-
-    def test_list_server_group_servers(self):
-        instance_ids = utils.list_server_group_servers(self.alb_client, server_group_id)
-        print(instance_ids)
-
-
-#  todo
-    def test_remove_servers_from_server_group(self):
-        utils.remove_servers_from_server_group(self.alb_client, server_group_id, instance_id, port=80)
-
-
-
-
-    def test_update_server_group_servers_attribute(self):
-        instance_id = ["i-bp19n839usecekzn2ig9"]
-        server_group_id = "sgp-ec4gopoclruofsfmxu"
-        add_weight_list = [(10, 3), (0, 1)]
-        port = "80"
-        utils.update_server_group_servers_attribute(self.alb_client, [server_group_id], instance_id, add_weight_list, port)
-
-
-
-    def test_run_command(self):
-        instance_id = ["i-bp19n839usecekzn2ig9"]
-        command="ls"
-        utils.run_command(self.ecs_client, instance_ids=instance_id, command=command)
-
-
-
-
-
-
-if __name__ == '__main__':
-    unittest.main()

+ 0 - 8
test/runcommand.py

@@ -1,8 +0,0 @@
-import unittest
-
-class MyTestCase(unittest.TestCase):
-    def test_something(self):
-        self.assertEqual(True, False)  # add assertion here
-
-if __name__ == '__main__':
-    unittest.main()

+ 0 - 0
util/__init__.py


+ 0 - 555
util/utils.py

@@ -1,555 +0,0 @@
-import logging
-import json
-import sys
-import time
-from asyncio import wait_for
-
-import requests
-import asyncio
-import time
-
-from alibabacloud_tea_util.client import Client as UtilClient
-from aliyunsdkcore.client import AcsClient
-from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
-from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
-from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
-from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
-from aliyunsdkecs.request.v20140526.SendFileRequest import SendFileRequest
-from aliyunsdkecs.request.v20140526.StopInstancesRequest import StopInstancesRequest
-from aliyunsdkecs.request.v20140526.DeleteInstancesRequest import DeleteInstancesRequest
-from aliyunsdkecs.request.v20140526.DescribeInstanceStatusRequest import DescribeInstanceStatusRequest
-from aliyunsdkecs.request.v20140526.ModifySecurityGroupRuleRequest import ModifySecurityGroupRuleRequest
-from alibabacloud_alb20200616.client import Client as Alb20200616Client
-from alibabacloud_tea_openapi import models as open_api_models
-from alibabacloud_alb20200616 import models as alb_models
-from alibabacloud_alb20200616 import models as alb_20200616_models
-from alibabacloud_tea_util import models as util_models
-
-
-logging.basicConfig(level=logging.INFO,
-                    format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
-                    datefmt='%a, %d %b %Y %H:%M:%S')
-
-
-def send_msg_to_feishu(webhook, key_word, msg_text):
-    """发送消息到飞书"""
-    headers = {'Content-Type': 'application/json'}
-    payload_message = {
-        "msg_type": "text",
-        "content": {
-            "text": '{}: {}'.format(key_word, msg_text)
-        }
-    }
-    response = requests.request('POST', url=webhook, headers=headers, data=json.dumps(payload_message))
-    logging.info(response.text)
-
-
-def connect_client(access_key_id, access_key_secret, region_id):
-    """
-    初始化账号,连接客户端
-    :param access_key_id: access key Id, type-string
-    :param access_key_secret: access key secret, type-string
-    :param region_id: region_id
-    :return: clt
-    """
-    try:
-        clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
-        return clt
-    except Exception as e:
-        # 失败,记录报错信息,发送通知,停止并退出
-        logging.error(e)
-        sys.exit()
-
-
-def connect_alb_client(access_key_id, access_key_secret, endpoint):
-    """
-    初始化ALB客户端
-    :param access_key_id: access key Id, type-string
-    :param access_key_secret: access key secret, type-string
-    :return: alb_client
-    """
-    config = open_api_models.Config(
-        access_key_id=access_key_id,
-        access_key_secret=access_key_secret,
-        endpoint=endpoint
-    )
-    alb_client = Alb20200616Client(config)
-    return alb_client
-
-
-
-
-
-def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
-                                   disk_size, disk_category, key_pair_name, tags):
-    """
-    购买服务器参数配置
-    :param image_id: 使用的镜像信息 type-string
-    :param vswitch_id: 选择的交换机 type-string
-    :param security_group_id: 当前vpc类型的安全组 type-string
-    :param zone_id: 服务器所在区域 type-string
-    :param instance_type: 实例规格 type-string
-    :param instance_name: 实例命名 type-string
-    :param disk_size: 磁盘大小,单位:G,type-string
-    :param disk_category: 磁盘类型 type-string
-    :param key_pair_name: 密钥对名称 type-string
-    :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
-    :return: request
-    """
-    request = RunInstancesRequest()
-    request.set_ImageId(image_id)
-    request.set_VSwitchId(vswitch_id)
-    request.set_SecurityGroupId(security_group_id)
-    request.set_ZoneId(zone_id)
-    request.set_InstanceType(instance_type)
-    request.set_InstanceName(instance_name)
-    request.set_SystemDiskSize(disk_size)
-    request.set_SystemDiskCategory(disk_category)
-    request.set_KeyPairName(key_pair_name)
-    request.set_Tags(tags)
-    return request
-
-
-def send_req(client, request):
-    """
-    发送API请求
-    :param client: 客户端连接
-    :param request: 请求配置
-    :return: response
-    """
-    request.set_accept_format('json')
-    response = client.do_action_with_exception(request)
-    #print(response)
-    response = json.loads(response)
-    print(response)
-        # logging.info(response)
-    print(response.get('Code'))
-    return response
-    #except Exception as e:
-        # 失败,记录报错信息,发送通知,停止并退出
-    #logging.error(e)
-    #sys.exit()
-
-
-def check_instance_running(ecs_client, instance_ids):
-    """
-    检查服务器运行状态
-    :param ecs_client: 客户端连接
-    :param instance_ids: 实例id列表, type-list
-    :return: running_count,Status为Running的实例数
-    """
-    try:
-        request = DescribeInstancesRequest()
-        request.set_InstanceIds(json.dumps(instance_ids))
-        request.set_PageSize(100)
-        response = send_request(ecs_client=ecs_client, request=request)
-        if response.get('Code') is None:
-            instances_list = response.get('Instances').get('Instance')
-            running_count = 0
-            running_instances = []
-            for instance_detail in instances_list:
-                if instance_detail.get('Status') == "Running":
-                    running_count += 1
-                    running_instances.append(instance_detail.get('InstanceId'))
-            return running_count, running_instances
-        else:
-            # 失败,记录报错信息,发送通知,停止并退出
-            logging.error(response)
-            sys.exit()
-    except Exception as e:
-        # 失败,记录报错信息,发送通知,停止并退出
-        logging.error(e)
-        sys.exit()
-
-
-def get_ip_address(ecs_client, instance_id):
-    """
-    获取实例IP地址
-    :param ecs_client: 客户端连接
-    :param instance_id: 实例id, type-string
-    :return: ip_address, type-string
-    """
-    request = DescribeNetworkInterfacesRequest()
-    request.set_accept_format('json')
-    request.set_InstanceId(instance_id)
-    response = send_request(ecs_client=ecs_client, request=request)
-    ip_address = response['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
-    return ip_address
-
-
-
-def create_multiple_instances(amount, ecs_client,
-                              image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
-                              disk_size, disk_category, key_pair_name, tags):
-    """
-    创建多个ECS实例
-    :param amount: 创建实例数 type-int 取值范围:[1, 100]
-    :param ecs_client: 购买机器客户端连接
-    :param image_id: 使用的镜像信息 type-string
-    :param vswitch_id: 选择的交换机 type-string
-    :param security_group_id: 当前vpc类型的安全组 type-string
-    :param zone_id: 服务器所在区域 type-string
-    :param instance_type: 实例规格 type-string
-    :param instance_name: 实例命名 type-string
-    :param disk_size: 磁盘大小,单位:G,type-string
-    :param disk_category: 磁盘类型 type-string
-    :param key_pair_name: 密钥对名称 type-string
-    :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
-    :return:
-    """
-    logging.info(f"create instances start, request amount: {amount}.")
-    # 1. 连接客户端
-    # create_instances_clt = connect_client(
-    #     access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
-    # )
-    # 2. 请求参数配置
-    request = build_create_instances_request(
-        image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
-        instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
-        key_pair_name=key_pair_name, tags=tags
-    )
-    request.set_Amount(amount)
-    # 3. 发送API请求,购买机器并启动
-    response = send_request(ecs_client=ecs_client, request=request)
-    if response.get('Code') is None:
-        instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
-        logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
-        # 获取机器运行状态
-        running_amount = 0
-        while running_amount < amount:
-            time.sleep(10)
-            running_amount, running_instances = check_instance_running(ecs_client=ecs_client, instance_ids=instance_ids)
-            logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
-        return instance_ids
-    else:
-        # 失败,记录报错信息,发送通知,停止并退出
-        logging.error(response)
-        sys.exit()
-
-
-
-def release_instances(ecs_client, instance_ids, force=False):
-    """
-    释放实例
-    :param ecs_client:
-    :param instance_ids: instance_id, type-list
-    :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
-    :return:
-    """
-    request = DeleteInstancesRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_Force(force)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
-
-
-def get_instances_status(ecs_client, instance_ids):
-    """
-    获取实例运行状态
-    :param ecs_client:
-    :param instance_ids: instance_id, type-list
-    :return:
-    """
-    request = DescribeInstanceStatusRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_PageSize(50)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
-
-
-def stop_instances(ecs_client, instance_ids, force_stop=False):
-    """
-    停止实例
-    :param ecs_client:
-    :param instance_ids: 实例ID, type-list
-    :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
-    :return:
-    """
-    request = StopInstancesRequest()
-    request.set_InstanceIds(instance_ids)
-    request.set_ForceStop(force_stop)
-    response = send_request(ecs_client=ecs_client, request=request)
-    return response
-
-
-
-
-def send_request(ecs_client, request):
-    """
-    发送API请求
-    :param ecs_client: 客户端连接
-    :param request: 请求配置
-    :return: response
-    """
-    request.set_accept_format('json')
-    try:
-        response = ecs_client.do_action_with_exception(request)
-        response = json.loads(response)
-        # logging.info(response)
-        return response
-    except Exception as e:
-        # 失败,记录报错信息,发送通知,停止并退出
-        logging.error(e)
-        sys.exit()
-
-
-
-def run_command(ecs_client, instance_ids, command):
-    """
-    批量执行命令
-    :param ecs_client: 客户端连接
-    :param instance_ids: 实例id列表, type-list, 最多能指定50台ECS实例ID
-    :param command: 命令 type-string
-    :return:
-    """
-    print(11111)
-    print(ecs_client, instance_ids, command)
-    for i in range(len(instance_ids) // 50 + 1):
-        instance_id_list = instance_ids[i * 50:(i + 1) * 50]
-        if len(instance_id_list) == 0:
-            return
-        request = RunCommandRequest()
-        request.set_accept_format('json')
-        request.set_Type("RunShellScript")
-        request.set_CommandContent(command)
-        request.set_InstanceIds(instance_id_list)
-        response = send_request(ecs_client=ecs_client, request=request)
-        logging.info(response)
-
-
-def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
-    """
-    发送文件到ecs;alb应用,区分上方clb
-    :param ecs_client:
-    :param instance_id_list: 最多能指定50台ECS实例ID
-    :param target_dir: 文件存放目录 type-string
-    :param name: 文件名 type-string
-    :param content: 文件内容 type-string
-    :return:
-    """
-    if not instance_id_list:
-        logging.warning("实例ID列表为空,无法发送文件。")
-        return
-
-    for i in range(len(instance_id_list) // 50 + 1):
-        instance_ids = instance_id_list[i * 50:(i + 1) * 50]
-        if len(instance_ids) == 0:
-            logging.info("没有更多的实例ID需要发送文件,退出。")
-            return
-        request = SendFileRequest()
-        request.set_Content(content)
-        request.set_TargetDir(target_dir)
-        request.set_Name(name)
-        request.set_Overwrite(True)
-        request.set_InstanceIds(instance_ids)
-        try:
-            logging.info(f"正在向实例 {instance_ids} 发送文件 '{name}' 到目录 '{target_dir}'")
-            response = send_request(ecs_client=ecs_client, request=request)
-            logging.info(f"成功发送文件到实例 {instance_ids},响应: {response}")
-        except Exception as e:
-            logging.error(f"发送文件到实例 {instance_ids} 失败,错误: {str(e)}")
-
-
-
-def add_servers_to_server_group(alb_client, server_group_id, instance_id, weight, port):
-    """
-    添加服务器到ALB服务器组
-    :param alb_client: ALB客户端连接
-    :param server_group_id: 服务器组ID
-    :param instance_id: 实例ID
-    :param weight: 权重
-    :param port: 后端服务器使用的端口
-    """
-    server = alb_models.AddServersToServerGroupRequestServers(
-        server_id=instance_id,
-        server_type='ecs',
-        weight=weight,
-        port=port
-    )
-    request = alb_models.AddServersToServerGroupRequest(
-        server_group_id=server_group_id,
-        servers=[server]
-    )
-    runtime = util_models.RuntimeOptions()
-    try:
-        alb_client.add_servers_to_server_group_with_options(request, runtime)
-        logging.info(f"Successfully added server {instance_id} to server group {server_group_id} with weight {weight}.")
-    except Exception as e:
-        logging.error(f"Failed to add server {instance_id} to server group {server_group_id}: {str(e)}")
-
-
-
-def remove_servers_from_server_group(alb_client, server_group_id, instance_ids, port):
-    """
-    从ALB服务器组中移除服务器
-    :param alb_client: ALB客户端连接
-    :param server_group_id: 服务器组ID
-    :param instance_ids: 实例ID
-    :param port: 后端服务器使用的端口
-    """
-    for instance_id in instance_ids:
-        server = alb_models.RemoveServersFromServerGroupRequestServers(
-            port=port,
-            server_id=instance_id,
-            server_type='ecs'
-        )
-        request = alb_models.RemoveServersFromServerGroupRequest(
-            server_group_id=server_group_id,
-            servers=[server]
-        )
-        runtime = util_models.RuntimeOptions()
-        try:
-            alb_client.remove_servers_from_server_group_with_options(request, runtime)
-            logging.info(f"Successfully removed server {instance_id} from server group {server_group_id}.")
-        except Exception as e:
-            logging.error(f"Failed to remove server {instance_id} from server group {server_group_id}: {str(e)}")
-
-
-
-
-def list_server_group_servers(alb_client, server_group_id):
-    """
-    列出服务器组中的服务器并返回实例ID列表
-    @param alb_client: ALB客户端
-    @param server_group_id: 服务器组ID
-    @return: 实例ID列表
-    """
-    list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-
-    try:
-        response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
-        instance_ids = [server.server_id for server in response.body.servers]
-        return instance_ids
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-        return []
-
-
-async def list_server_group_servers_async(alb_client, server_group_id):
-    """
-    异步列出指定服务器组中的服务器并返回实例ID列表
-    @param alb_client: ALB客户端
-    @param server_group_id: 服务器组ID
-    @return: 实例ID列表
-    """
-    list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-
-    try:
-        response = await alb_client.list_server_group_servers_with_options_async(list_server_group_servers_request, runtime)
-        instance_ids = [server.server_id for server in response.body.servers]
-        return instance_ids
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-        return []
-
-
-def update_server_group_server_weight(alb_client, server_group_id, instance_id_list, weight, port):
-    """
-    更指定服务器在服务器组中的权重
-    :param alb_client: ALB客户端
-    :param server_group_id: 服务器组ID
-    :param instance_id_list: 实例ID
-    :param weight: 权重值
-    :param port: 后端服务器使用的端口
-    """
-    # for i in range(0, len(instance_id_list), 20):
-    #     instances_list = instance_id_list[i * 20:(i + 1) * 20]
-    #     if not instances_list:
-    #         return
-    print(instance_id_list)
-    for server_id in instance_id_list:
-        server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
-            server_type='Ecs',
-            server_id=server_id,
-            weight=weight,
-            port=port
-        )
-        request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
-            servers=[server],
-            server_group_id=server_group_id
-        )
-        runtime = util_models.RuntimeOptions()
-        try:
-            alb_client.update_server_group_servers_attribute_with_options(request, runtime)
-            logging.info(f"Successfully updated server {server_id} in group {server_group_id} to weight {weight}.")
-        except Exception as error:
-            logging.error(f"Failed to update server {server_id}: {str(error)}")
-
-def update_server_group_servers_attribute(alb_client, server_group_id_list, instance_id_list, weight_list, port):
-    """
-    更新服务器组中的服务器权重
-    :param alb_client: ALB客户端
-    :param server_group_id_list: 服务器组ID列表
-    :param instance_id_list: 实例ID列表
-    :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
-    :param port: 后端服务器使用的端口
-    """
-    for weight, sleep_time in weight_list:
-        logging.info(f"修改权重中: weight = {weight}")
-        for server_group_id in server_group_id_list:
-            flag = True
-            while flag:
-                try:
-                    update_server_group_server_weight(alb_client=alb_client, server_group_id=server_group_id, instance_id_list=instance_id_list,
-                                             weight=weight, port=port)
-                    logging.info(f"alb: {server_group_id} finished!")
-                    flag = False
-                except Exception as e:
-                    logging.warning(f"Error updating group {server_group_id}, retrying in 10 seconds: {str(e)}")
-                    time.sleep(10)
-                    continue
-        time.sleep(sleep_time)
-
-
-async def update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port):
-    """
-    异步更新特定服务器在服务器组中的权重
-    :param alb_client: ALB客户端
-    :param server_group_id: 服务器组ID
-    :param instance_id: 实例ID
-    :param weight: 权重值
-    :param port: 后端服务器使用的端口
-    """
-    server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
-        server_type='Ecs',
-        server_id=instance_id,
-        weight=weight,
-        port=port
-    )
-    request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
-        servers=[server],
-        server_group_id=server_group_id
-    )
-    runtime = util_models.RuntimeOptions()
-    try:
-        await alb_client.update_server_group_servers_attribute_with_options_async(request, runtime)
-        print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight} asynchronously.")
-    except Exception as error:
-        print(str(error))
-        UtilClient.assert_as_string(str(error))
-
-async def update_server_group_servers_attribute_async(alb_client, server_group_id_list, instance_ids, weight_list, port):
-    """
-    异步更新服务器组中的服务器属性
-    :param alb_client: ALB客户端
-    :param server_group_id_list: 服务器组ID列表
-    :param instance_ids: 实例ID列表
-    :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
-    """
-    tasks = []
-    for server_group_id in server_group_id_list:
-        for instance_id in instance_ids:
-            for weight, sleep_time in weight_list:
-                tasks.append(update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port))
-                await asyncio.sleep(sleep_time)
-    await asyncio.gather(*tasks)