utils.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524
  1. import logging
  2. import json
  3. import sys
  4. import time
  5. from asyncio import wait_for
  6. import requests
  7. import asyncio
  8. import time
  9. from alibabacloud_tea_util.client import Client as UtilClient
  10. from aliyunsdkcore.client import AcsClient
  11. from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
  12. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  13. from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
  14. from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
  15. from aliyunsdkecs.request.v20140526.SendFileRequest import SendFileRequest
  16. from aliyunsdkecs.request.v20140526.StopInstancesRequest import StopInstancesRequest
  17. from aliyunsdkecs.request.v20140526.DeleteInstancesRequest import DeleteInstancesRequest
  18. from aliyunsdkecs.request.v20140526.DescribeInstanceStatusRequest import DescribeInstanceStatusRequest
  19. from aliyunsdkecs.request.v20140526.ModifySecurityGroupRuleRequest import ModifySecurityGroupRuleRequest
  20. from alibabacloud_alb20200616.client import Client as Alb20200616Client
  21. from alibabacloud_tea_openapi import models as open_api_models
  22. from alibabacloud_alb20200616 import models as alb_models
  23. from alibabacloud_alb20200616 import models as alb_20200616_models
  24. from alibabacloud_tea_util import models as util_models
  25. from urllib3 import request
  26. logging.basicConfig(level=logging.INFO,
  27. format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
  28. datefmt='%a, %d %b %Y %H:%M:%S')
  29. def send_msg_to_feishu(webhook, key_word, msg_text):
  30. """发送消息到飞书"""
  31. headers = {'Content-Type': 'application/json'}
  32. payload_message = {
  33. "msg_type": "text",
  34. "content": {
  35. "text": '{}: {}'.format(key_word, msg_text)
  36. }
  37. }
  38. response = requests.request('POST', url=webhook, headers=headers, data=json.dumps(payload_message))
  39. logging.info(response.text)
  40. def connect_client(access_key_id, access_key_secret, region_id):
  41. """
  42. 初始化账号,连接客户端
  43. :param access_key_id: access key Id, type-string
  44. :param access_key_secret: access key secret, type-string
  45. :param region_id: region_id
  46. :return: clt
  47. """
  48. try:
  49. clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
  50. return clt
  51. except Exception as e:
  52. # 失败,记录报错信息,发送通知,停止并退出
  53. logging.error(e)
  54. sys.exit()
  55. def connect_alb_client(access_key_id, access_key_secret, endpoint):
  56. """
  57. 初始化ALB客户端
  58. :param access_key_id: access key Id, type-string
  59. :param access_key_secret: access key secret, type-string
  60. :return: alb_client
  61. """
  62. config = open_api_models.Config(
  63. access_key_id=access_key_id,
  64. access_key_secret=access_key_secret,
  65. endpoint=endpoint
  66. )
  67. alb_client = Alb20200616Client(config)
  68. return alb_client
  69. def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  70. disk_size, disk_category, key_pair_name, tags):
  71. """
  72. 购买服务器参数配置
  73. :param image_id: 使用的镜像信息 type-string
  74. :param vswitch_id: 选择的交换机 type-string
  75. :param security_group_id: 当前vpc类型的安全组 type-string
  76. :param zone_id: 服务器所在区域 type-string
  77. :param instance_type: 实例规格 type-string
  78. :param instance_name: 实例命名 type-string
  79. :param disk_size: 磁盘大小,单位:G,type-string
  80. :param disk_category: 磁盘类型 type-string
  81. :param key_pair_name: 密钥对名称 type-string
  82. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  83. :return: request
  84. """
  85. request = RunInstancesRequest()
  86. request.set_ImageId(image_id)
  87. request.set_VSwitchId(vswitch_id)
  88. request.set_SecurityGroupId(security_group_id)
  89. request.set_ZoneId(zone_id)
  90. request.set_InstanceType(instance_type)
  91. request.set_InstanceName(instance_name)
  92. request.set_SystemDiskSize(disk_size)
  93. request.set_SystemDiskCategory(disk_category)
  94. request.set_KeyPairName(key_pair_name)
  95. request.set_Tags(tags)
  96. return request
  97. def send_req(client, request):
  98. """
  99. 发送API请求
  100. :param client: 客户端连接
  101. :param request: 请求配置
  102. :return: response
  103. """
  104. request.set_accept_format('json')
  105. response = client.do_action_with_exception(request)
  106. #print(response)
  107. response = json.loads(response)
  108. print(response)
  109. # logging.info(response)
  110. print(response.get('Code'))
  111. return response
  112. #except Exception as e:
  113. # 失败,记录报错信息,发送通知,停止并退出
  114. #logging.error(e)
  115. #sys.exit()
  116. def check_instance_running(ecs_client, instance_ids):
  117. """
  118. 检查服务器运行状态
  119. :param ecs_client: 客户端连接
  120. :param instance_ids: 实例id列表, type-list
  121. :return: running_count,Status为Running的实例数
  122. """
  123. try:
  124. request = DescribeInstancesRequest()
  125. request.set_InstanceIds(json.dumps(instance_ids))
  126. request.set_PageSize(100)
  127. response = send_request(ecs_client=ecs_client, request=request)
  128. if response.get('Code') is None:
  129. instances_list = response.get('Instances').get('Instance')
  130. running_count = 0
  131. running_instances = []
  132. for instance_detail in instances_list:
  133. if instance_detail.get('Status') == "Running":
  134. running_count += 1
  135. running_instances.append(instance_detail.get('InstanceId'))
  136. return running_count, running_instances
  137. else:
  138. # 失败,记录报错信息,发送通知,停止并退出
  139. logging.error(response)
  140. sys.exit()
  141. except Exception as e:
  142. # 失败,记录报错信息,发送通知,停止并退出
  143. logging.error(e)
  144. sys.exit()
  145. def get_ip_address(ecs_client, instance_id):
  146. """
  147. 获取实例IP地址
  148. :param ecs_client: 客户端连接
  149. :param instance_id: 实例id, type-string
  150. :return: ip_address, type-string
  151. """
  152. request = DescribeNetworkInterfacesRequest()
  153. request.set_accept_format('json')
  154. request.set_InstanceId(instance_id)
  155. response = send_request(ecs_client=ecs_client, request=request)
  156. ip_address = response['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
  157. return ip_address
  158. def create_multiple_instances(amount, ecs_client,
  159. image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  160. disk_size, disk_category, key_pair_name, tags):
  161. """
  162. 创建多个ECS实例
  163. :param amount: 创建实例数 type-int 取值范围:[1, 100]
  164. :param ecs_client: 购买机器客户端连接
  165. :param image_id: 使用的镜像信息 type-string
  166. :param vswitch_id: 选择的交换机 type-string
  167. :param security_group_id: 当前vpc类型的安全组 type-string
  168. :param zone_id: 服务器所在区域 type-string
  169. :param instance_type: 实例规格 type-string
  170. :param instance_name: 实例命名 type-string
  171. :param disk_size: 磁盘大小,单位:G,type-string
  172. :param disk_category: 磁盘类型 type-string
  173. :param key_pair_name: 密钥对名称 type-string
  174. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  175. :return:
  176. """
  177. logging.info(f"create instances start, request amount: {amount}.")
  178. # 1. 连接客户端
  179. # create_instances_clt = connect_client(
  180. # access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
  181. # )
  182. # 2. 请求参数配置
  183. request = build_create_instances_request(
  184. image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
  185. instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
  186. key_pair_name=key_pair_name, tags=tags
  187. )
  188. request.set_Amount(amount)
  189. # 3. 发送API请求,购买机器并启动
  190. response = send_request(ecs_client=ecs_client, request=request)
  191. if response.get('Code') is None:
  192. instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
  193. logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
  194. # 获取机器运行状态
  195. running_amount = 0
  196. while running_amount < amount:
  197. time.sleep(10)
  198. running_amount, running_instances = check_instance_running(ecs_client=ecs_client, instance_ids=instance_ids)
  199. logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
  200. return instance_ids
  201. else:
  202. # 失败,记录报错信息,发送通知,停止并退出
  203. logging.error(response)
  204. sys.exit()
  205. def release_instances(ecs_client, instance_ids, force=False):
  206. """
  207. 释放实例
  208. :param ecs_client:
  209. :param instance_ids: instance_id, type-list
  210. :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
  211. :return:
  212. """
  213. request = DeleteInstancesRequest()
  214. request.set_InstanceIds(instance_ids)
  215. request.set_Force(force)
  216. response = send_request(ecs_client=ecs_client, request=request)
  217. return response
  218. def get_instances_status(ecs_client, instance_ids):
  219. """
  220. 获取实例运行状态
  221. :param ecs_client:
  222. :param instance_ids: instance_id, type-list
  223. :return:
  224. """
  225. request = DescribeInstanceStatusRequest()
  226. request.set_InstanceIds(instance_ids)
  227. request.set_PageSize(50)
  228. response = send_request(ecs_client=ecs_client, request=request)
  229. return response
  230. def stop_instances(ecs_client, instance_ids, force_stop=False):
  231. """
  232. 停止实例
  233. :param ecs_client:
  234. :param instance_ids: 实例ID, type-list
  235. :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
  236. :return:
  237. """
  238. request = StopInstancesRequest()
  239. request.set_InstanceIds(instance_ids)
  240. request.set_ForceStop(force_stop)
  241. response = send_request(ecs_client=ecs_client, request=request)
  242. return response
  243. def send_request(ecs_client, request):
  244. """
  245. 发送API请求
  246. :param ecs_client: 客户端连接
  247. :param request: 请求配置
  248. :return: response
  249. """
  250. request.set_accept_format('json')
  251. try:
  252. response = ecs_client.do_action_with_exception(request)
  253. response = json.loads(response)
  254. # logging.info(response)
  255. return response
  256. except Exception as e:
  257. # 失败,记录报错信息,发送通知,停止并退出
  258. logging.error(e)
  259. sys.exit()
  260. def run_command(ecs_client, instance_ids, command):
  261. """
  262. 批量执行命令
  263. :param ecs_client: 客户端连接
  264. :param instance_ids: 实例id列表, type-list, 最多能指定50台ECS实例ID
  265. :param command: 命令 type-string
  266. :return:
  267. """
  268. for i in range(len(instance_ids) // 50 + 1):
  269. instance_id_list = instance_ids[i * 50:(i + 1) * 50]
  270. if len(instance_id_list) == 0:
  271. return
  272. request = RunCommandRequest()
  273. request.set_accept_format('json')
  274. request.set_Type("RunShellScript")
  275. request.set_CommandContent(command)
  276. request.set_InstanceIds(instance_id_list)
  277. response = send_request(ecs_client=ecs_client, request=request)
  278. logging.info(response)
  279. def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
  280. """
  281. 发送文件到ecs;alb应用,区分上方clb
  282. :param ecs_client:
  283. :param instance_id_list: 最多能指定50台ECS实例ID
  284. :param target_dir: 文件存放目录 type-string
  285. :param name: 文件名 type-string
  286. :param content: 文件内容 type-string
  287. :return:
  288. """
  289. if not instance_id_list:
  290. logging.warning("实例ID列表为空,无法发送文件。")
  291. return
  292. for i in range(len(instance_id_list) // 50 + 1):
  293. instance_ids = instance_id_list[i * 50:(i + 1) * 50]
  294. if len(instance_ids) == 0:
  295. logging.info("没有更多的实例ID需要发送文件,退出。")
  296. return
  297. request = SendFileRequest()
  298. request.set_Content(content)
  299. request.set_TargetDir(target_dir)
  300. request.set_Name(name)
  301. request.set_Overwrite(True)
  302. request.set_InstanceIds(instance_ids)
  303. try:
  304. logging.info(f"正在向实例 {instance_ids} 发送文件 '{name}' 到目录 '{target_dir}'")
  305. response = send_request(ecs_client=ecs_client, request=request)
  306. logging.info(f"成功发送文件到实例 {instance_ids},响应: {response}")
  307. except Exception as e:
  308. logging.error(f"发送文件到实例 {instance_ids} 失败,错误: {str(e)}")
  309. def add_servers_to_server_group(alb_client, server_group_ids, instance_ids, weight, port):
  310. """
  311. 添加服务器到ALB服务器组
  312. :param alb_client: ALB客户端连接
  313. :param server_group_ids: 服务器组ID
  314. :param instance_ids: 实例ID
  315. :param weight: 权重
  316. :param port: 后端服务器使用的端口
  317. """
  318. servers = []
  319. for i in range(len(instance_ids)):
  320. server = alb_models.AddServersToServerGroupRequestServers(
  321. server_id=instance_ids[i],
  322. server_type='ecs',
  323. weight=weight,
  324. port=port
  325. )
  326. servers.append(server)
  327. # server = alb_models.AddServersToServerGroupRequestServers(
  328. # server_id=instance_id,
  329. # server_type='ecs',
  330. # weight=weight,
  331. # port=port
  332. # )
  333. for server_group_id in server_group_ids:
  334. request = alb_models.AddServersToServerGroupRequest(
  335. server_group_id=server_group_id,
  336. servers=servers
  337. )
  338. runtime = util_models.RuntimeOptions()
  339. try:
  340. alb_client.add_servers_to_server_group_with_options(request, runtime)
  341. logging.info(f"Successfully added instance_ids {instance_ids} to server group {server_group_id} with weight {weight}.")
  342. except Exception as e:
  343. logging.error(f"Failed to add instance_ids {instance_ids} to server group {server_group_id}: {str(e)}")
  344. sys.exit()
  345. def remove_servers_from_server_group(alb_client, server_group_id_list, instance_ids, port):
  346. """
  347. 从ALB服务器组中移除服务器
  348. :param alb_client: ALB客户端连接
  349. :param server_group_id_list: 服务器组ID list
  350. :param instance_ids: 实例ID list
  351. :param port: 后端服务器使用的端口
  352. """
  353. servers = []
  354. for instance_id in instance_ids:
  355. server = alb_models.RemoveServersFromServerGroupRequestServers(
  356. port=port,
  357. server_id=instance_id,
  358. server_type='ecs'
  359. )
  360. servers.append(server)
  361. for server_group_id in server_group_id_list:
  362. request = alb_models.RemoveServersFromServerGroupRequest(
  363. server_group_id=server_group_id,
  364. servers=servers
  365. )
  366. runtime = util_models.RuntimeOptions()
  367. try:
  368. alb_client.remove_servers_from_server_group_with_options(request, runtime)
  369. logging.info(f"Successfully removed instance_ids {instance_ids} from server group {server_group_id}.")
  370. except Exception as e:
  371. logging.error(f"Failed to remove instance_ids {instance_ids} from server group {server_group_id}: {str(e)}")
  372. sys.exit()
  373. def list_server_group_servers(alb_client, server_group_id):
  374. """
  375. 列出服务器组中的服务器并返回实例ID列表
  376. @param alb_client: ALB客户端
  377. @param server_group_id: 服务器组ID
  378. @return: 实例ID列表
  379. """
  380. list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
  381. server_group_id=server_group_id,
  382. max_results=100
  383. )
  384. runtime = util_models.RuntimeOptions()
  385. try:
  386. response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
  387. instance_ids = [server.server_id for server in response.body.servers]
  388. return instance_ids
  389. except Exception as error:
  390. print(str(error))
  391. UtilClient.assert_as_string(str(error))
  392. return []
  393. def update_server_group_server_weight(alb_client, server_group_id_list, instance_id_list, weight, port):
  394. """
  395. 更指定服务器在服务器组中的权重
  396. :param alb_client: ALB客户端
  397. :param server_group_id_list: 服务器组ID list
  398. :param instance_id_list: 实例ID list
  399. :param weight: 权重值
  400. :param port: 后端服务器使用的端口
  401. """
  402. servers = []
  403. for i in range(len(instance_id_list)):
  404. server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
  405. server_type='Ecs',
  406. server_id=instance_id_list[i],
  407. weight=weight,
  408. port=port
  409. )
  410. servers.append(server)
  411. for server_group_id in server_group_id_list:
  412. request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
  413. servers=servers,
  414. server_group_id=server_group_id
  415. )
  416. # logging.info(f"servers = {servers}")
  417. runtime = util_models.RuntimeOptions()
  418. try:
  419. # logging.info(f"instance_id_list = {instance_id_list} request = {request}")
  420. alb_client.update_server_group_servers_attribute_with_options(request, runtime)
  421. logging.info(f"Successfully updated servers {instance_id_list} in group {server_group_id} to weight {weight}.")
  422. except Exception as e:
  423. logging.error(e)
  424. sys.exit()
  425. def update_server_group_servers_attribute(alb_client, server_group_id_list, instance_id_list, weight_list, port):
  426. """
  427. 更新服务器组中的服务器权重
  428. :param alb_client: ALB客户端
  429. :param server_group_id_list: 服务器组ID列表
  430. :param instance_id_list: 实例ID列表
  431. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  432. :param port: 后端服务器使用的端口
  433. """
  434. # for server_group_id in server_group_id_list:
  435. # for instance_id in instance_id_list:
  436. for weight, sleep_time in weight_list:
  437. update_server_group_server_weight(alb_client, server_group_id_list, instance_id_list, weight, port)
  438. time.sleep(sleep_time)
  439. # check_server_group_status(alb_client, server_group_id_list)
  440. def check_server_group_status(alb_client, server_group_id_list):
  441. list_server_groups_request = alb_20200616_models.ListServerGroupsRequest(
  442. server_group_ids=server_group_id_list,
  443. max_results=100
  444. )
  445. flag = False
  446. runtime = util_models.RuntimeOptions()
  447. for i in range(10):
  448. try:
  449. response = alb_client.list_server_groups_with_options(list_server_groups_request, runtime)
  450. count = 0
  451. if response.body:
  452. server_groups = UtilClient.to_map(response.body).get("ServerGroups")
  453. if server_groups:
  454. for server_group in server_groups:
  455. if server_group.get("ServerGroupStatus") == "Available":
  456. logging.info(f"Server group {server_group} is available.")
  457. count +=1
  458. if count == len(server_group_id_list):
  459. flag = True
  460. break
  461. time.sleep(2)
  462. except Exception as e:
  463. logging.error(e)
  464. if not flag:
  465. sys.exit()