alb_utils.py 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541
  1. import logging
  2. import json
  3. import sys
  4. import time
  5. from asyncio import wait_for
  6. import requests
  7. import asyncio
  8. import time
  9. from alibabacloud_tea_util.client import Client as UtilClient
  10. from aliyunsdkcore.client import AcsClient
  11. from aliyunsdkslb.request.v20140515.AddBackendServersRequest import AddBackendServersRequest
  12. from aliyunsdkslb.request.v20140515.RemoveBackendServersRequest import RemoveBackendServersRequest
  13. from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
  14. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  15. from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
  16. from aliyunsdkslb.request.v20140515.DescribeLoadBalancerAttributeRequest import DescribeLoadBalancerAttributeRequest
  17. from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
  18. from aliyunsdkecs.request.v20140526.SendFileRequest import SendFileRequest
  19. from aliyunsdkecs.request.v20140526.StopInstancesRequest import StopInstancesRequest
  20. from aliyunsdkecs.request.v20140526.DeleteInstancesRequest import DeleteInstancesRequest
  21. from aliyunsdkecs.request.v20140526.DescribeInstanceStatusRequest import DescribeInstanceStatusRequest
  22. from aliyunsdkcore.request import CommonRequest
  23. from alibabacloud_alb20200616.client import Client as Alb20200616Client
  24. from alibabacloud_tea_openapi import models as open_api_models
  25. from alibabacloud_alb20200616 import models as alb_models
  26. from alibabacloud_alb20200616 import models as alb_20200616_models
  27. from alibabacloud_tea_util import models as util_models
  28. from aliyunsdkalb.request.v20200616.ListServerGroupServersRequest import ListServerGroupServersRequest
  29. from aliyunsdkcore.acs_exception.exceptions import ClientException, ServerException
  30. from urllib3.connection import port_by_scheme
  31. logging.basicConfig(level=logging.INFO,
  32. format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
  33. datefmt='%a, %d %b %Y %H:%M:%S')
  34. def send_msg_to_feishu(webhook, key_word, msg_text):
  35. """发送消息到飞书"""
  36. headers = {'Content-Type': 'application/json'}
  37. payload_message = {
  38. "msg_type": "text",
  39. "content": {
  40. "text": '{}: {}'.format(key_word, msg_text)
  41. }
  42. }
  43. response = requests.request('POST', url=webhook, headers=headers, data=json.dumps(payload_message))
  44. logging.info(response.text)
  45. def connect_client(access_key_id, access_key_secret, region_id):
  46. """
  47. 初始化账号,连接客户端
  48. :param access_key_id: access key Id, type-string
  49. :param access_key_secret: access key secret, type-string
  50. :param region_id: region_id
  51. :return: clt
  52. """
  53. try:
  54. clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
  55. return clt
  56. except Exception as e:
  57. # 失败,记录报错信息,发送通知,停止并退出
  58. logging.error(e)
  59. sys.exit()
  60. def connect_alb_client(access_key_id, access_key_secret, endpoint):
  61. """
  62. 初始化ALB客户端
  63. :param access_key_id: access key Id, type-string
  64. :param access_key_secret: access key secret, type-string
  65. :return: alb_client
  66. """
  67. config = open_api_models.Config(
  68. access_key_id=access_key_id,
  69. access_key_secret=access_key_secret,
  70. endpoint=endpoint
  71. )
  72. alb_client = Alb20200616Client(config)
  73. return alb_client
  74. def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  75. disk_size, disk_category, key_pair_name, tags):
  76. """
  77. 购买服务器参数配置
  78. :param image_id: 使用的镜像信息 type-string
  79. :param vswitch_id: 选择的交换机 type-string
  80. :param security_group_id: 当前vpc类型的安全组 type-string
  81. :param zone_id: 服务器所在区域 type-string
  82. :param instance_type: 实例规格 type-string
  83. :param instance_name: 实例命名 type-string
  84. :param disk_size: 磁盘大小,单位:G,type-string
  85. :param disk_category: 磁盘类型 type-string
  86. :param key_pair_name: 密钥对名称 type-string
  87. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  88. :return: request
  89. """
  90. request = RunInstancesRequest()
  91. request.set_ImageId(image_id)
  92. request.set_VSwitchId(vswitch_id)
  93. request.set_SecurityGroupId(security_group_id)
  94. request.set_ZoneId(zone_id)
  95. request.set_InstanceType(instance_type)
  96. request.set_InstanceName(instance_name)
  97. request.set_SystemDiskSize(disk_size)
  98. request.set_SystemDiskCategory(disk_category)
  99. request.set_KeyPairName(key_pair_name)
  100. request.set_Tags(tags)
  101. return request
  102. def send_req(client, request):
  103. """
  104. 发送API请求
  105. :param client: 客户端连接
  106. :param request: 请求配置
  107. :return: response
  108. """
  109. request.set_accept_format('json')
  110. response = client.do_action_with_exception(request)
  111. #print(response)
  112. response = json.loads(response)
  113. print(response)
  114. # logging.info(response)
  115. print(response.get('Code'))
  116. return response
  117. #except Exception as e:
  118. # 失败,记录报错信息,发送通知,停止并退出
  119. #logging.error(e)
  120. #sys.exit()
  121. def check_instance_running(ecs_client, instance_ids):
  122. """
  123. 检查服务器运行状态
  124. :param ecs_client: 客户端连接
  125. :param instance_ids: 实例id列表, type-list
  126. :return: running_count,Status为Running的实例数
  127. """
  128. try:
  129. request = DescribeInstancesRequest()
  130. request.set_InstanceIds(json.dumps(instance_ids))
  131. request.set_PageSize(100)
  132. response = send_request(ecs_client=ecs_client, request=request)
  133. if response.get('Code') is None:
  134. instances_list = response.get('Instances').get('Instance')
  135. running_count = 0
  136. running_instances = []
  137. for instance_detail in instances_list:
  138. if instance_detail.get('Status') == "Running":
  139. running_count += 1
  140. running_instances.append(instance_detail.get('InstanceId'))
  141. return running_count, running_instances
  142. else:
  143. # 失败,记录报错信息,发送通知,停止并退出
  144. logging.error(response)
  145. sys.exit()
  146. except Exception as e:
  147. # 失败,记录报错信息,发送通知,停止并退出
  148. logging.error(e)
  149. sys.exit()
  150. def get_ip_address(ecs_client, instance_id):
  151. """
  152. 获取实例IP地址
  153. :param ecs_client: 客户端连接
  154. :param instance_id: 实例id, type-string
  155. :return: ip_address, type-string
  156. """
  157. request = DescribeNetworkInterfacesRequest()
  158. request.set_accept_format('json')
  159. request.set_InstanceId(instance_id)
  160. response = send_request(ecs_client=ecs_client, request=request)
  161. ip_address = response['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
  162. return ip_address
  163. def create_multiple_instances(amount, ecs_client,
  164. image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  165. disk_size, disk_category, key_pair_name, tags):
  166. """
  167. 创建多个ECS实例
  168. :param amount: 创建实例数 type-int 取值范围:[1, 100]
  169. :param ecs_client: 购买机器客户端连接
  170. :param image_id: 使用的镜像信息 type-string
  171. :param vswitch_id: 选择的交换机 type-string
  172. :param security_group_id: 当前vpc类型的安全组 type-string
  173. :param zone_id: 服务器所在区域 type-string
  174. :param instance_type: 实例规格 type-string
  175. :param instance_name: 实例命名 type-string
  176. :param disk_size: 磁盘大小,单位:G,type-string
  177. :param disk_category: 磁盘类型 type-string
  178. :param key_pair_name: 密钥对名称 type-string
  179. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  180. :return:
  181. """
  182. logging.info(f"create instances start, request amount: {amount}.")
  183. # 1. 连接客户端
  184. # create_instances_clt = connect_client(
  185. # access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
  186. # )
  187. # 2. 请求参数配置
  188. request = build_create_instances_request(
  189. image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
  190. instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
  191. key_pair_name=key_pair_name, tags=tags
  192. )
  193. request.set_Amount(amount)
  194. # 3. 发送API请求,购买机器并启动
  195. response = send_request(ecs_client=ecs_client, request=request)
  196. if response.get('Code') is None:
  197. instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
  198. logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
  199. # 获取机器运行状态
  200. running_amount = 0
  201. while running_amount < amount:
  202. time.sleep(10)
  203. running_amount, running_instances = check_instance_running(ecs_client=ecs_client, instance_ids=instance_ids)
  204. logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
  205. return instance_ids
  206. else:
  207. # 失败,记录报错信息,发送通知,停止并退出
  208. logging.error(response)
  209. sys.exit()
  210. def release_instances(ecs_client, instance_ids, force=False):
  211. """
  212. 释放实例
  213. :param ecs_client:
  214. :param instance_ids: instance_id, type-list
  215. :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
  216. :return:
  217. """
  218. request = DeleteInstancesRequest()
  219. request.set_InstanceIds(instance_ids)
  220. request.set_Force(force)
  221. response = send_request(ecs_client=ecs_client, request=request)
  222. return response
  223. def get_instances_status(ecs_client, instance_ids):
  224. """
  225. 获取实例运行状态
  226. :param ecs_client:
  227. :param instance_ids: instance_id, type-list
  228. :return:
  229. """
  230. request = DescribeInstanceStatusRequest()
  231. request.set_InstanceIds(instance_ids)
  232. request.set_PageSize(50)
  233. response = send_request(ecs_client=ecs_client, request=request)
  234. return response
  235. def stop_instances(ecs_client, instance_ids, force_stop=False):
  236. """
  237. 停止实例
  238. :param ecs_client:
  239. :param instance_ids: 实例ID, type-list
  240. :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
  241. :return:
  242. """
  243. request = StopInstancesRequest()
  244. request.set_InstanceIds(instance_ids)
  245. request.set_ForceStop(force_stop)
  246. response = send_request(ecs_client=ecs_client, request=request)
  247. return response
  248. def send_request(ecs_client, request):
  249. """
  250. 发送API请求
  251. :param ecs_client: 客户端连接
  252. :param request: 请求配置
  253. :return: response
  254. """
  255. request.set_accept_format('json')
  256. try:
  257. response = ecs_client.do_action_with_exception(request)
  258. response = json.loads(response)
  259. # logging.info(response)
  260. return response
  261. except Exception as e:
  262. # 失败,记录报错信息,发送通知,停止并退出
  263. logging.error(e)
  264. sys.exit()
  265. def run_command(ecs_client, instance_ids, command):
  266. """
  267. 批量执行命令
  268. :param ecs_client: 客户端连接
  269. :param instance_ids: 实例id列表, type-list, 最多能指定50台ECS实例ID
  270. :param command: 命令 type-string
  271. :return:
  272. """
  273. for i in range(len(instance_ids) // 50 + 1):
  274. instance_id_list = instance_ids[i * 50:(i + 1) * 50]
  275. if len(instance_id_list) == 0:
  276. return
  277. request = RunCommandRequest()
  278. request.set_accept_format('json')
  279. request.set_Type("RunShellScript")
  280. request.set_CommandContent(command)
  281. request.set_InstanceIds(instance_id_list)
  282. response = send_request(ecs_client=ecs_client, request=request)
  283. logging.info(response)
  284. def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
  285. """
  286. 发送文件到ecs;alb应用,区分上方clb
  287. :param ecs_client:
  288. :param instance_id_list: 最多能指定50台ECS实例ID
  289. :param target_dir: 文件存放目录 type-string
  290. :param name: 文件名 type-string
  291. :param content: 文件内容 type-string
  292. :return:
  293. """
  294. if not instance_id_list:
  295. logging.warning("实例ID列表为空,无法发送文件。")
  296. return
  297. for i in range(len(instance_id_list) // 50 + 1):
  298. instance_ids = instance_id_list[i * 50:(i + 1) * 50]
  299. if len(instance_ids) == 0:
  300. logging.info("没有更多的实例ID需要发送文件,退出。")
  301. return
  302. request = SendFileRequest()
  303. request.set_Content(content)
  304. request.set_TargetDir(target_dir)
  305. request.set_Name(name)
  306. request.set_Overwrite(True)
  307. request.set_InstanceIds(instance_ids)
  308. try:
  309. logging.info(f"正在向实例 {instance_ids} 发送文件 '{name}' 到目录 '{target_dir}'")
  310. response = send_request(ecs_client=ecs_client, request=request)
  311. logging.info(f"成功发送文件到实例 {instance_ids},响应: {response}")
  312. except Exception as e:
  313. logging.error(f"发送文件到实例 {instance_ids} 失败,错误: {str(e)}")
  314. def add_servers_to_server_group(alb_client, server_group_id, instance_id, weight, port):
  315. """
  316. 添加服务器到ALB服务器组
  317. :param alb_client: ALB客户端连接
  318. :param server_group_id: 服务器组ID
  319. :param instance_id: 实例ID
  320. :param weight: 权重
  321. :param port: 后端服务器使用的端口
  322. """
  323. server = alb_models.AddServersToServerGroupRequestServers(
  324. server_id=instance_id,
  325. server_type='ecs',
  326. weight=weight,
  327. port=port
  328. )
  329. request = alb_models.AddServersToServerGroupRequest(
  330. server_group_id=server_group_id,
  331. servers=[server]
  332. )
  333. runtime = util_models.RuntimeOptions()
  334. try:
  335. alb_client.add_servers_to_server_group_with_options(request, runtime)
  336. logging.info(f"Successfully added server {instance_id} to server group {server_group_id} with weight {weight}.")
  337. except Exception as e:
  338. logging.error(f"Failed to add server {instance_id} to server group {server_group_id}: {str(e)}")
  339. def remove_servers_from_server_group(alb_client, server_group_id, instance_id, port):
  340. """
  341. 从ALB服务器组中移除服务器
  342. :param alb_client: ALB客户端连接
  343. :param server_group_id: 服务器组ID
  344. :param instance_id: 实例ID
  345. :param port: 后端服务器使用的端口
  346. """
  347. server = alb_models.RemoveServersFromServerGroupRequestServers(
  348. port=port,
  349. server_id=instance_id,
  350. server_type='ecs'
  351. )
  352. request = alb_models.RemoveServersFromServerGroupRequest(
  353. server_group_id=server_group_id,
  354. servers=[server]
  355. )
  356. runtime = util_models.RuntimeOptions()
  357. try:
  358. alb_client.remove_servers_from_server_group_with_options(request, runtime)
  359. logging.info(f"Successfully removed server {instance_id} from server group {server_group_id}.")
  360. except Exception as e:
  361. logging.error(f"Failed to remove server {instance_id} from server group {server_group_id}: {str(e)}")
  362. def list_server_group_servers(alb_client, server_group_id):
  363. """
  364. 列出服务器组中的服务器并返回实例ID列表
  365. @param alb_client: ALB客户端
  366. @param server_group_id: 服务器组ID
  367. @return: 实例ID列表
  368. """
  369. list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
  370. server_group_id=server_group_id
  371. )
  372. runtime = util_models.RuntimeOptions()
  373. try:
  374. response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
  375. instance_ids = [server.server_id for server in response.body.servers]
  376. return instance_ids
  377. except Exception as error:
  378. print(str(error))
  379. UtilClient.assert_as_string(str(error))
  380. return []
  381. async def list_server_group_servers_async(alb_client, server_group_id):
  382. """
  383. 异步列出指定服务器组中的服务器并返回实例ID列表
  384. @param alb_client: ALB客户端
  385. @param server_group_id: 服务器组ID
  386. @return: 实例ID列表
  387. """
  388. list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
  389. server_group_id=server_group_id
  390. )
  391. runtime = util_models.RuntimeOptions()
  392. try:
  393. response = await alb_client.list_server_group_servers_with_options_async(list_server_group_servers_request, runtime)
  394. instance_ids = [server.server_id for server in response.body.servers]
  395. return instance_ids
  396. except Exception as error:
  397. print(str(error))
  398. UtilClient.assert_as_string(str(error))
  399. return []
  400. def update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port):
  401. """
  402. 更新特定服务器在服务器组中的权重
  403. :param alb_client: ALB客户端
  404. :param server_group_id: 服务器组ID
  405. :param instance_id: 实例ID
  406. :param weight: 权重值
  407. :param port: 后端服务器使用的端口
  408. """
  409. server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
  410. server_type='Ecs',
  411. server_id=instance_id,
  412. weight=weight,
  413. port=port
  414. )
  415. request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
  416. servers=[server],
  417. server_group_id=server_group_id
  418. )
  419. runtime = util_models.RuntimeOptions()
  420. try:
  421. alb_client.update_server_group_servers_attribute_with_options(request, runtime)
  422. print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight}.")
  423. except Exception as error:
  424. print(str(error))
  425. UtilClient.assert_as_string(str(error))
  426. def update_server_group_servers_attribute(alb_client, server_group_id_list, instance_id_list, weight_list, port):
  427. """
  428. 更新服务器组中的服务器权重
  429. :param alb_client: ALB客户端
  430. :param server_group_id_list: 服务器组ID列表
  431. :param instance_id_list: 实例ID列表
  432. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  433. :param port: 后端服务器使用的端口
  434. """
  435. for server_group_id in server_group_id_list:
  436. for instance_id in instance_id_list:
  437. for weight, sleep_time in weight_list:
  438. update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port)
  439. time.sleep(sleep_time)
  440. async def update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port):
  441. """
  442. 异步更新特定服务器在服务器组中的权重
  443. :param alb_client: ALB客户端
  444. :param server_group_id: 服务器组ID
  445. :param instance_id: 实例ID
  446. :param weight: 权重值
  447. :param port: 后端服务器使用的端口
  448. """
  449. server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
  450. server_type='Ecs',
  451. server_id=instance_id,
  452. weight=weight,
  453. port=port
  454. )
  455. request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
  456. servers=[server],
  457. server_group_id=server_group_id
  458. )
  459. runtime = util_models.RuntimeOptions()
  460. try:
  461. await alb_client.update_server_group_servers_attribute_with_options_async(request, runtime)
  462. print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight} asynchronously.")
  463. except Exception as error:
  464. print(str(error))
  465. UtilClient.assert_as_string(str(error))
  466. async def update_server_group_servers_attribute_async(alb_client, server_group_id_list, instance_ids, weight_list, port):
  467. """
  468. 异步更新服务器组中的服务器属性
  469. :param alb_client: ALB客户端
  470. :param server_group_id_list: 服务器组ID列表
  471. :param instance_ids: 实例ID列表
  472. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  473. """
  474. tasks = []
  475. for server_group_id in server_group_id_list:
  476. for instance_id in instance_ids:
  477. for weight, sleep_time in weight_list:
  478. tasks.append(update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port))
  479. await asyncio.sleep(sleep_time)
  480. await asyncio.gather(*tasks)