utils.py 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540
  1. import logging
  2. import json
  3. import sys
  4. import time
  5. from asyncio import wait_for
  6. import requests
  7. import asyncio
  8. import time
  9. from alibabacloud_tea_util.client import Client as UtilClient
  10. from aliyunsdkcore.client import AcsClient
  11. from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
  12. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  13. from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
  14. from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
  15. from aliyunsdkecs.request.v20140526.SendFileRequest import SendFileRequest
  16. from aliyunsdkecs.request.v20140526.StopInstancesRequest import StopInstancesRequest
  17. from aliyunsdkecs.request.v20140526.DeleteInstancesRequest import DeleteInstancesRequest
  18. from aliyunsdkecs.request.v20140526.DescribeInstanceStatusRequest import DescribeInstanceStatusRequest
  19. from alibabacloud_alb20200616.client import Client as Alb20200616Client
  20. from alibabacloud_tea_openapi import models as open_api_models
  21. from alibabacloud_alb20200616 import models as alb_models
  22. from alibabacloud_alb20200616 import models as alb_20200616_models
  23. from alibabacloud_tea_util import models as util_models
  24. logging.basicConfig(level=logging.INFO,
  25. format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
  26. datefmt='%a, %d %b %Y %H:%M:%S')
  27. def send_msg_to_feishu(webhook, key_word, msg_text):
  28. """发送消息到飞书"""
  29. headers = {'Content-Type': 'application/json'}
  30. payload_message = {
  31. "msg_type": "text",
  32. "content": {
  33. "text": '{}: {}'.format(key_word, msg_text)
  34. }
  35. }
  36. response = requests.request('POST', url=webhook, headers=headers, data=json.dumps(payload_message))
  37. logging.info(response.text)
  38. def connect_client(access_key_id, access_key_secret, region_id):
  39. """
  40. 初始化账号,连接客户端
  41. :param access_key_id: access key Id, type-string
  42. :param access_key_secret: access key secret, type-string
  43. :param region_id: region_id
  44. :return: clt
  45. """
  46. try:
  47. clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
  48. return clt
  49. except Exception as e:
  50. # 失败,记录报错信息,发送通知,停止并退出
  51. logging.error(e)
  52. sys.exit()
  53. def connect_alb_client(access_key_id, access_key_secret, endpoint):
  54. """
  55. 初始化ALB客户端
  56. :param access_key_id: access key Id, type-string
  57. :param access_key_secret: access key secret, type-string
  58. :return: alb_client
  59. """
  60. config = open_api_models.Config(
  61. access_key_id=access_key_id,
  62. access_key_secret=access_key_secret,
  63. endpoint=endpoint
  64. )
  65. alb_client = Alb20200616Client(config)
  66. return alb_client
  67. def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  68. disk_size, disk_category, key_pair_name, tags):
  69. """
  70. 购买服务器参数配置
  71. :param image_id: 使用的镜像信息 type-string
  72. :param vswitch_id: 选择的交换机 type-string
  73. :param security_group_id: 当前vpc类型的安全组 type-string
  74. :param zone_id: 服务器所在区域 type-string
  75. :param instance_type: 实例规格 type-string
  76. :param instance_name: 实例命名 type-string
  77. :param disk_size: 磁盘大小,单位:G,type-string
  78. :param disk_category: 磁盘类型 type-string
  79. :param key_pair_name: 密钥对名称 type-string
  80. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  81. :return: request
  82. """
  83. request = RunInstancesRequest()
  84. request.set_ImageId(image_id)
  85. request.set_VSwitchId(vswitch_id)
  86. request.set_SecurityGroupId(security_group_id)
  87. request.set_ZoneId(zone_id)
  88. request.set_InstanceType(instance_type)
  89. request.set_InstanceName(instance_name)
  90. request.set_SystemDiskSize(disk_size)
  91. request.set_SystemDiskCategory(disk_category)
  92. request.set_KeyPairName(key_pair_name)
  93. request.set_Tags(tags)
  94. return request
  95. def send_req(client, request):
  96. """
  97. 发送API请求
  98. :param client: 客户端连接
  99. :param request: 请求配置
  100. :return: response
  101. """
  102. request.set_accept_format('json')
  103. response = client.do_action_with_exception(request)
  104. #print(response)
  105. response = json.loads(response)
  106. print(response)
  107. # logging.info(response)
  108. print(response.get('Code'))
  109. return response
  110. #except Exception as e:
  111. # 失败,记录报错信息,发送通知,停止并退出
  112. #logging.error(e)
  113. #sys.exit()
  114. def check_instance_running(ecs_client, instance_ids):
  115. """
  116. 检查服务器运行状态
  117. :param ecs_client: 客户端连接
  118. :param instance_ids: 实例id列表, type-list
  119. :return: running_count,Status为Running的实例数
  120. """
  121. try:
  122. request = DescribeInstancesRequest()
  123. request.set_InstanceIds(json.dumps(instance_ids))
  124. request.set_PageSize(100)
  125. response = send_request(ecs_client=ecs_client, request=request)
  126. if response.get('Code') is None:
  127. instances_list = response.get('Instances').get('Instance')
  128. running_count = 0
  129. running_instances = []
  130. for instance_detail in instances_list:
  131. if instance_detail.get('Status') == "Running":
  132. running_count += 1
  133. running_instances.append(instance_detail.get('InstanceId'))
  134. return running_count, running_instances
  135. else:
  136. # 失败,记录报错信息,发送通知,停止并退出
  137. logging.error(response)
  138. sys.exit()
  139. except Exception as e:
  140. # 失败,记录报错信息,发送通知,停止并退出
  141. logging.error(e)
  142. sys.exit()
  143. def get_ip_address(ecs_client, instance_id):
  144. """
  145. 获取实例IP地址
  146. :param ecs_client: 客户端连接
  147. :param instance_id: 实例id, type-string
  148. :return: ip_address, type-string
  149. """
  150. request = DescribeNetworkInterfacesRequest()
  151. request.set_accept_format('json')
  152. request.set_InstanceId(instance_id)
  153. response = send_request(ecs_client=ecs_client, request=request)
  154. ip_address = response['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
  155. return ip_address
  156. def create_multiple_instances(amount, ecs_client,
  157. image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  158. disk_size, disk_category, key_pair_name, tags):
  159. """
  160. 创建多个ECS实例
  161. :param amount: 创建实例数 type-int 取值范围:[1, 100]
  162. :param ecs_client: 购买机器客户端连接
  163. :param image_id: 使用的镜像信息 type-string
  164. :param vswitch_id: 选择的交换机 type-string
  165. :param security_group_id: 当前vpc类型的安全组 type-string
  166. :param zone_id: 服务器所在区域 type-string
  167. :param instance_type: 实例规格 type-string
  168. :param instance_name: 实例命名 type-string
  169. :param disk_size: 磁盘大小,单位:G,type-string
  170. :param disk_category: 磁盘类型 type-string
  171. :param key_pair_name: 密钥对名称 type-string
  172. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  173. :return:
  174. """
  175. logging.info(f"create instances start, request amount: {amount}.")
  176. # 1. 连接客户端
  177. # create_instances_clt = connect_client(
  178. # access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
  179. # )
  180. # 2. 请求参数配置
  181. request = build_create_instances_request(
  182. image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
  183. instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
  184. key_pair_name=key_pair_name, tags=tags
  185. )
  186. request.set_Amount(amount)
  187. # 3. 发送API请求,购买机器并启动
  188. response = send_request(ecs_client=ecs_client, request=request)
  189. if response.get('Code') is None:
  190. instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
  191. logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
  192. # 获取机器运行状态
  193. running_amount = 0
  194. while running_amount < amount:
  195. time.sleep(10)
  196. running_amount, running_instances = check_instance_running(ecs_client=ecs_client, instance_ids=instance_ids)
  197. logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
  198. return instance_ids
  199. else:
  200. # 失败,记录报错信息,发送通知,停止并退出
  201. logging.error(response)
  202. sys.exit()
  203. def release_instances(ecs_client, instance_ids, force=False):
  204. """
  205. 释放实例
  206. :param ecs_client:
  207. :param instance_ids: instance_id, type-list
  208. :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
  209. :return:
  210. """
  211. request = DeleteInstancesRequest()
  212. request.set_InstanceIds(instance_ids)
  213. request.set_Force(force)
  214. response = send_request(ecs_client=ecs_client, request=request)
  215. return response
  216. def get_instances_status(ecs_client, instance_ids):
  217. """
  218. 获取实例运行状态
  219. :param ecs_client:
  220. :param instance_ids: instance_id, type-list
  221. :return:
  222. """
  223. request = DescribeInstanceStatusRequest()
  224. request.set_InstanceIds(instance_ids)
  225. request.set_PageSize(50)
  226. response = send_request(ecs_client=ecs_client, request=request)
  227. return response
  228. def stop_instances(ecs_client, instance_ids, force_stop=False):
  229. """
  230. 停止实例
  231. :param ecs_client:
  232. :param instance_ids: 实例ID, type-list
  233. :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
  234. :return:
  235. """
  236. request = StopInstancesRequest()
  237. request.set_InstanceIds(instance_ids)
  238. request.set_ForceStop(force_stop)
  239. response = send_request(ecs_client=ecs_client, request=request)
  240. return response
  241. def send_request(ecs_client, request):
  242. """
  243. 发送API请求
  244. :param ecs_client: 客户端连接
  245. :param request: 请求配置
  246. :return: response
  247. """
  248. request.set_accept_format('json')
  249. try:
  250. response = ecs_client.do_action_with_exception(request)
  251. response = json.loads(response)
  252. # logging.info(response)
  253. return response
  254. except Exception as e:
  255. # 失败,记录报错信息,发送通知,停止并退出
  256. logging.error(e)
  257. sys.exit()
  258. def run_command(ecs_client, instance_ids, command):
  259. """
  260. 批量执行命令
  261. :param ecs_client: 客户端连接
  262. :param instance_ids: 实例id列表, type-list, 最多能指定50台ECS实例ID
  263. :param command: 命令 type-string
  264. :return:
  265. """
  266. for i in range(len(instance_ids) // 50 + 1):
  267. instance_id_list = instance_ids[i * 50:(i + 1) * 50]
  268. if len(instance_id_list) == 0:
  269. return
  270. request = RunCommandRequest()
  271. request.set_accept_format('json')
  272. request.set_Type("RunShellScript")
  273. request.set_CommandContent(command)
  274. request.set_InstanceIds(instance_id_list)
  275. response = send_request(ecs_client=ecs_client, request=request)
  276. logging.info(response)
  277. def send_file_to_ecs(ecs_client, instance_id_list, target_dir, name, content):
  278. """
  279. 发送文件到ecs;alb应用,区分上方clb
  280. :param ecs_client:
  281. :param instance_id_list: 最多能指定50台ECS实例ID
  282. :param target_dir: 文件存放目录 type-string
  283. :param name: 文件名 type-string
  284. :param content: 文件内容 type-string
  285. :return:
  286. """
  287. if not instance_id_list:
  288. logging.warning("实例ID列表为空,无法发送文件。")
  289. return
  290. for i in range(len(instance_id_list) // 50 + 1):
  291. instance_ids = instance_id_list[i * 50:(i + 1) * 50]
  292. if len(instance_ids) == 0:
  293. logging.info("没有更多的实例ID需要发送文件,退出。")
  294. return
  295. request = SendFileRequest()
  296. request.set_Content(content)
  297. request.set_TargetDir(target_dir)
  298. request.set_Name(name)
  299. request.set_Overwrite(True)
  300. request.set_InstanceIds(instance_ids)
  301. try:
  302. logging.info(f"正在向实例 {instance_ids} 发送文件 '{name}' 到目录 '{target_dir}'")
  303. response = send_request(ecs_client=ecs_client, request=request)
  304. logging.info(f"成功发送文件到实例 {instance_ids},响应: {response}")
  305. except Exception as e:
  306. logging.error(f"发送文件到实例 {instance_ids} 失败,错误: {str(e)}")
  307. def add_servers_to_server_group(alb_client, server_group_id, instance_id, weight, port):
  308. """
  309. 添加服务器到ALB服务器组
  310. :param alb_client: ALB客户端连接
  311. :param server_group_id: 服务器组ID
  312. :param instance_id: 实例ID
  313. :param weight: 权重
  314. :param port: 后端服务器使用的端口
  315. """
  316. server = alb_models.AddServersToServerGroupRequestServers(
  317. server_id=instance_id,
  318. server_type='ecs',
  319. weight=weight,
  320. port=port
  321. )
  322. request = alb_models.AddServersToServerGroupRequest(
  323. server_group_id=server_group_id,
  324. servers=[server]
  325. )
  326. runtime = util_models.RuntimeOptions()
  327. try:
  328. alb_client.add_servers_to_server_group_with_options(request, runtime)
  329. logging.info(f"Successfully added server {instance_id} to server group {server_group_id} with weight {weight}.")
  330. except Exception as e:
  331. logging.error(f"Failed to add server {instance_id} to server group {server_group_id}: {str(e)}")
  332. def remove_servers_from_server_group(alb_client, server_group_id, instance_ids, port):
  333. """
  334. 从ALB服务器组中移除服务器
  335. :param alb_client: ALB客户端连接
  336. :param server_group_id: 服务器组ID
  337. :param instance_ids: 实例ID
  338. :param port: 后端服务器使用的端口
  339. """
  340. for instance_id in instance_ids:
  341. server = alb_models.RemoveServersFromServerGroupRequestServers(
  342. port=port,
  343. server_id=instance_id,
  344. server_type='ecs'
  345. )
  346. request = alb_models.RemoveServersFromServerGroupRequest(
  347. server_group_id=server_group_id,
  348. servers=[server]
  349. )
  350. runtime = util_models.RuntimeOptions()
  351. try:
  352. alb_client.remove_servers_from_server_group_with_options(request, runtime)
  353. logging.info(f"Successfully removed server {instance_id} from server group {server_group_id}.")
  354. except Exception as e:
  355. logging.error(f"Failed to remove server {instance_id} from server group {server_group_id}: {str(e)}")
  356. def list_server_group_servers(alb_client, server_group_id):
  357. """
  358. 列出服务器组中的服务器并返回实例ID列表
  359. @param alb_client: ALB客户端
  360. @param server_group_id: 服务器组ID
  361. @return: 实例ID列表
  362. """
  363. list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
  364. server_group_id=server_group_id
  365. )
  366. runtime = util_models.RuntimeOptions()
  367. try:
  368. response = alb_client.list_server_group_servers_with_options(list_server_group_servers_request, runtime)
  369. instance_ids = [server.server_id for server in response.body.servers]
  370. return instance_ids
  371. except Exception as error:
  372. print(str(error))
  373. UtilClient.assert_as_string(str(error))
  374. return []
  375. async def list_server_group_servers_async(alb_client, server_group_id):
  376. """
  377. 异步列出指定服务器组中的服务器并返回实例ID列表
  378. @param alb_client: ALB客户端
  379. @param server_group_id: 服务器组ID
  380. @return: 实例ID列表
  381. """
  382. list_server_group_servers_request = alb_20200616_models.ListServerGroupServersRequest(
  383. server_group_id=server_group_id
  384. )
  385. runtime = util_models.RuntimeOptions()
  386. try:
  387. response = await alb_client.list_server_group_servers_with_options_async(list_server_group_servers_request, runtime)
  388. instance_ids = [server.server_id for server in response.body.servers]
  389. return instance_ids
  390. except Exception as error:
  391. print(str(error))
  392. UtilClient.assert_as_string(str(error))
  393. return []
  394. def update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port):
  395. """
  396. 更指定服务器在服务器组中的权重
  397. :param alb_client: ALB客户端
  398. :param server_group_id: 服务器组ID
  399. :param instance_id: 实例ID
  400. :param weight: 权重值
  401. :param port: 后端服务器使用的端口
  402. """
  403. server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
  404. server_type='Ecs',
  405. server_id=instance_id,
  406. weight=weight,
  407. port=port
  408. )
  409. request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
  410. servers=[server],
  411. server_group_id=server_group_id
  412. )
  413. runtime = util_models.RuntimeOptions()
  414. try:
  415. alb_client.update_server_group_servers_attribute_with_options(request, runtime)
  416. print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight}.")
  417. except Exception as error:
  418. print(str(error))
  419. UtilClient.assert_as_string(str(error))
  420. def update_server_group_servers_attribute(alb_client, server_group_id_list, instance_id_list, weight_list, port):
  421. """
  422. 更新服务器组中的服务器权重
  423. :param alb_client: ALB客户端
  424. :param server_group_id_list: 服务器组ID列表
  425. :param instance_id_list: 实例ID列表
  426. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  427. :param port: 后端服务器使用的端口
  428. """
  429. for server_group_id in server_group_id_list:
  430. for instance_id in instance_id_list:
  431. for weight, sleep_time in weight_list:
  432. update_server_group_server_weight(alb_client, server_group_id, instance_id, weight, port)
  433. time.sleep(sleep_time)
  434. async def update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port):
  435. """
  436. 异步更新特定服务器在服务器组中的权重
  437. :param alb_client: ALB客户端
  438. :param server_group_id: 服务器组ID
  439. :param instance_id: 实例ID
  440. :param weight: 权重值
  441. :param port: 后端服务器使用的端口
  442. """
  443. server = alb_20200616_models.UpdateServerGroupServersAttributeRequestServers(
  444. server_type='Ecs',
  445. server_id=instance_id,
  446. weight=weight,
  447. port=port
  448. )
  449. request = alb_20200616_models.UpdateServerGroupServersAttributeRequest(
  450. servers=[server],
  451. server_group_id=server_group_id
  452. )
  453. runtime = util_models.RuntimeOptions()
  454. try:
  455. await alb_client.update_server_group_servers_attribute_with_options_async(request, runtime)
  456. print(f"Successfully updated server {instance_id} in group {server_group_id} to weight {weight} asynchronously.")
  457. except Exception as error:
  458. print(str(error))
  459. UtilClient.assert_as_string(str(error))
  460. async def update_server_group_servers_attribute_async(alb_client, server_group_id_list, instance_ids, weight_list, port):
  461. """
  462. 异步更新服务器组中的服务器属性
  463. :param alb_client: ALB客户端
  464. :param server_group_id_list: 服务器组ID列表
  465. :param instance_ids: 实例ID列表
  466. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  467. """
  468. tasks = []
  469. for server_group_id in server_group_id_list:
  470. for instance_id in instance_ids:
  471. for weight, sleep_time in weight_list:
  472. tasks.append(update_server_group_server_weight_async(alb_client, server_group_id, instance_id, weight, port))
  473. await asyncio.sleep(sleep_time)
  474. await asyncio.gather(*tasks)