utils.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480
  1. import logging
  2. import json
  3. import sys
  4. import time
  5. import requests
  6. import asyncio
  7. from aliyunsdkcore.client import AcsClient
  8. from aliyunsdkslb.request.v20140515.AddBackendServersRequest import AddBackendServersRequest
  9. from aliyunsdkslb.request.v20140515.RemoveBackendServersRequest import RemoveBackendServersRequest
  10. from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
  11. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  12. from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
  13. from aliyunsdkslb.request.v20140515.DescribeLoadBalancerAttributeRequest import DescribeLoadBalancerAttributeRequest
  14. from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
  15. from aliyunsdkecs.request.v20140526.SendFileRequest import SendFileRequest
  16. from aliyunsdkecs.request.v20140526.StopInstancesRequest import StopInstancesRequest
  17. from aliyunsdkecs.request.v20140526.DeleteInstancesRequest import DeleteInstancesRequest
  18. from aliyunsdkecs.request.v20140526.DescribeInstanceStatusRequest import DescribeInstanceStatusRequest
  19. from aliyunsdkcore.request import CommonRequest
  20. logging.basicConfig(level=logging.INFO,
  21. format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
  22. datefmt='%a, %d %b %Y %H:%M:%S')
  23. def send_msg_to_feishu(webhook, key_word, msg_text):
  24. """发送消息到飞书"""
  25. headers = {'Content-Type': 'application/json'}
  26. payload_message = {
  27. "msg_type": "text",
  28. "content": {
  29. "text": '{}: {}'.format(key_word, msg_text)
  30. }
  31. }
  32. response = requests.request('POST', url=webhook, headers=headers, data=json.dumps(payload_message))
  33. logging.info(response.text)
  34. def connect_client(access_key_id, access_key_secret, region_id):
  35. """
  36. 初始化账号,连接客户端
  37. :param access_key_id: access key Id, type-string
  38. :param access_key_secret: access key secret, type-string
  39. :param region_id: region_id
  40. :return: clt
  41. """
  42. try:
  43. clt = AcsClient(ak=access_key_id, secret=access_key_secret, region_id=region_id)
  44. return clt
  45. except Exception as e:
  46. # 失败,记录报错信息,发送通知,停止并退出
  47. logging.error(e)
  48. sys.exit()
  49. def build_create_instances_request(image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  50. disk_size, disk_category, key_pair_name, tags):
  51. """
  52. 购买服务器参数配置
  53. :param image_id: 使用的镜像信息 type-string
  54. :param vswitch_id: 选择的交换机 type-string
  55. :param security_group_id: 当前vpc类型的安全组 type-string
  56. :param zone_id: 服务器所在区域 type-string
  57. :param instance_type: 实例规格 type-string
  58. :param instance_name: 实例命名 type-string
  59. :param disk_size: 磁盘大小,单位:G,type-string
  60. :param disk_category: 磁盘类型 type-string
  61. :param key_pair_name: 密钥对名称 type-string
  62. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  63. :return: request
  64. """
  65. request = RunInstancesRequest()
  66. request.set_ImageId(image_id)
  67. request.set_VSwitchId(vswitch_id)
  68. request.set_SecurityGroupId(security_group_id)
  69. request.set_ZoneId(zone_id)
  70. request.set_InstanceType(instance_type)
  71. request.set_InstanceName(instance_name)
  72. request.set_SystemDiskSize(disk_size)
  73. request.set_SystemDiskCategory(disk_category)
  74. request.set_KeyPairName(key_pair_name)
  75. request.set_Tags(tags)
  76. return request
  77. def send_request(client, request):
  78. """
  79. 发送API请求
  80. :param client: 客户端连接
  81. :param request: 请求配置
  82. :return: response
  83. """
  84. request.set_accept_format('json')
  85. try:
  86. response = client.do_action_with_exception(request)
  87. response = json.loads(response)
  88. # logging.info(response)
  89. return response
  90. except Exception as e:
  91. # 失败,记录报错信息,发送通知,停止并退出
  92. logging.error(e)
  93. sys.exit()
  94. def check_instance_running(client, instance_ids):
  95. """
  96. 检查服务器运行状态
  97. :param client: 客户端连接
  98. :param instance_ids: 实例id列表, type-list
  99. :return: running_count,Status为Running的实例数
  100. """
  101. try:
  102. request = DescribeInstancesRequest()
  103. request.set_InstanceIds(json.dumps(instance_ids))
  104. request.set_PageSize(100)
  105. response = send_request(client=client, request=request)
  106. if response.get('Code') is None:
  107. instances_list = response.get('Instances').get('Instance')
  108. running_count = 0
  109. running_instances = []
  110. for instance_detail in instances_list:
  111. if instance_detail.get('Status') == "Running":
  112. running_count += 1
  113. running_instances.append(instance_detail.get('InstanceId'))
  114. return running_count, running_instances
  115. else:
  116. # 失败,记录报错信息,发送通知,停止并退出
  117. logging.error(response)
  118. sys.exit()
  119. except Exception as e:
  120. # 失败,记录报错信息,发送通知,停止并退出
  121. logging.error(e)
  122. sys.exit()
  123. def create_multiple_instances(amount, client,
  124. image_id, vswitch_id, security_group_id, zone_id, instance_type, instance_name,
  125. disk_size, disk_category, key_pair_name, tags):
  126. """
  127. 创建多个ECS实例
  128. :param amount: 创建实例数 type-int 取值范围:[1, 100]
  129. :param client: 购买机器客户端连接
  130. :param image_id: 使用的镜像信息 type-string
  131. :param vswitch_id: 选择的交换机 type-string
  132. :param security_group_id: 当前vpc类型的安全组 type-string
  133. :param zone_id: 服务器所在区域 type-string
  134. :param instance_type: 实例规格 type-string
  135. :param instance_name: 实例命名 type-string
  136. :param disk_size: 磁盘大小,单位:G,type-string
  137. :param disk_category: 磁盘类型 type-string
  138. :param key_pair_name: 密钥对名称 type-string
  139. :param tags: 标签 type-list, eg: [{"Key": "ecs", "Value": "rov-server.prod"}, ...]
  140. :return:
  141. """
  142. logging.info(f"create instances start, request amount: {amount}.")
  143. # 1. 连接客户端
  144. # create_instances_clt = connect_client(
  145. # access_key_id=access_key_id, access_key_secret=access_key_secret, region_id=region_id
  146. # )
  147. # 2. 请求参数配置
  148. request = build_create_instances_request(
  149. image_id=image_id, vswitch_id=vswitch_id, security_group_id=security_group_id, zone_id=zone_id,
  150. instance_type=instance_type, instance_name=instance_name, disk_size=disk_size, disk_category=disk_category,
  151. key_pair_name=key_pair_name, tags=tags
  152. )
  153. request.set_Amount(amount)
  154. # 3. 发送API请求,购买机器并启动
  155. response = send_request(client=client, request=request)
  156. if response.get('Code') is None:
  157. instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
  158. logging.info(f"success amount: {len(instance_ids)}, instance ids: {instance_ids}.")
  159. # 获取机器运行状态
  160. running_amount = 0
  161. while running_amount < amount:
  162. time.sleep(10)
  163. running_amount, running_instances = check_instance_running(client=client, instance_ids=instance_ids)
  164. logging.info(f"running amount: {running_amount}, running instances: {running_instances}.")
  165. return instance_ids
  166. else:
  167. # 失败,记录报错信息,发送通知,停止并退出
  168. logging.error(response)
  169. sys.exit()
  170. def run_command(client, instance_ids, command):
  171. """
  172. 批量执行命令
  173. :param client: 客户端连接
  174. :param instance_ids: 实例id列表, type-list
  175. :param command: 命令 type-string
  176. :return:
  177. """
  178. request = RunCommandRequest()
  179. request.set_accept_format('json')
  180. request.set_Type("RunShellScript")
  181. request.set_CommandContent(command)
  182. request.set_InstanceIds(instance_ids)
  183. response = send_request(client=client, request=request)
  184. logging.info(response)
  185. def get_instance_ids(client, slb_id):
  186. """
  187. 获取slb下所有服务器instanceId
  188. :param client: 客户端连接
  189. :param slb_id: 负载均衡id type-string
  190. :return: instance_ids type-list
  191. """
  192. request = DescribeLoadBalancerAttributeRequest()
  193. request.set_accept_format('json')
  194. request.set_LoadBalancerId(slb_id)
  195. response = send_request(client=client, request=request)
  196. instance_ids = [instance["ServerId"] for instance in response["BackendServers"]["BackendServer"]]
  197. return instance_ids
  198. def get_ip_address(client, instance_id):
  199. """
  200. 获取实例IP地址
  201. :param client: 客户端连接
  202. :param instance_id: 实例id, type-string
  203. :return: ip_address, type-string
  204. """
  205. request = DescribeNetworkInterfacesRequest()
  206. request.set_accept_format('json')
  207. request.set_InstanceId(instance_id)
  208. response = send_request(client=client, request=request)
  209. ip_address = response['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
  210. return ip_address
  211. def set_weight_for_instances(client, slb_id, instance_id_list, weight):
  212. """
  213. 同时设置多台服务器的slb权重,权重一样
  214. :param client: 客户端连接
  215. :param slb_id: slb_id
  216. :param instance_id_list: 服务器id list
  217. :param weight: 权重值
  218. :return: None
  219. """
  220. BackendServers = [{"ServerId": instance_id, "Weight": weight} for instance_id in instance_id_list]
  221. request = CommonRequest()
  222. request.set_accept_format('json')
  223. request.set_domain('slb.aliyuncs.com')
  224. request.set_version('2014-05-15')
  225. request.set_method('POST')
  226. request.set_action_name('SetBackendServers')
  227. request.add_query_param('BackendServers', BackendServers)
  228. request.add_query_param('LoadBalancerId', slb_id)
  229. response = send_request(client=client, request=request)
  230. return response
  231. def send_file_to_ecs(client, instance_id_list, target_dir, name, content):
  232. """
  233. 发送文件到ecs
  234. :param client:
  235. :param instance_id_list:
  236. :param target_dir: 文件存放目录 type-string
  237. :param name: 文件名 type-string
  238. :param content: 文件内容 type-string
  239. :return:
  240. """
  241. request = SendFileRequest()
  242. request.set_Content(content)
  243. request.set_TargetDir(target_dir)
  244. request.set_Name(name)
  245. request.set_Overwrite(True)
  246. request.set_InstanceIds(instance_id_list)
  247. response = send_request(client=client, request=request)
  248. return response
  249. def stop_instances(client, instance_ids, force_stop=False):
  250. """
  251. 停止实例
  252. :param client:
  253. :param instance_ids: 实例ID, type-list
  254. :param force_stop: 是否强制关机, True-强制关机, False-正常关机, type-bool
  255. :return:
  256. """
  257. request = StopInstancesRequest()
  258. request.set_InstanceIds(instance_ids)
  259. request.set_ForceStop(force_stop)
  260. response = send_request(client=client, request=request)
  261. return response
  262. def release_instances(client, instance_ids, force=False):
  263. """
  264. 释放实例
  265. :param client:
  266. :param instance_ids: instance_id, type-list
  267. :param force: 是否强制释放, True-强制释放, False-正常释放, type-bool
  268. :return:
  269. """
  270. request = DeleteInstancesRequest()
  271. request.set_InstanceIds(instance_ids)
  272. request.set_Force(force)
  273. response = send_request(client=client, request=request)
  274. return response
  275. def get_instances_status(client, instance_ids):
  276. """
  277. 获取实例运行状态
  278. :param client:
  279. :param instance_ids: instance_id, type-liist
  280. :return:
  281. """
  282. request = DescribeInstanceStatusRequest()
  283. request.set_InstanceIds(instance_ids)
  284. request.set_PageSize(50)
  285. response = send_request(client=client, request=request)
  286. return response
  287. def set_instance_weight_process(client, slb_id, instance_id_list, weight_list):
  288. """
  289. 修改服务器的权重值
  290. :param client: slb客户端连接
  291. :param slb_id: slb id
  292. :param instance_id_list: instance id list
  293. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  294. :return:
  295. """
  296. for weight, sleep_time in weight_list:
  297. logging.info(f"weight = {weight}")
  298. flag = True
  299. while flag:
  300. try:
  301. set_weight_for_instances(client=client, slb_id=slb_id, instance_id_list=instance_id_list, weight=weight)
  302. time.sleep(sleep_time)
  303. flag = False
  304. except Exception as e:
  305. time.sleep(10)
  306. continue
  307. def add_backend_servers(client, slb_id, instances):
  308. """
  309. 服务器挂载到负载均衡(必须是状态为运行中的后端服务器才可以加入负载均衡实例,每次调用最多可添加20个后端服务器)
  310. :param client:
  311. :param slb_id:
  312. :param instances: 实例列表 [(instance_id, ip), ...]
  313. :return:
  314. """
  315. try:
  316. for i in range(len(instances) // 20 + 1):
  317. instances_list = instances[i * 20:(i + 1) * 20]
  318. if len(instances_list) == 0:
  319. return
  320. request = AddBackendServersRequest()
  321. request.set_accept_format('json')
  322. request.set_LoadBalancerId(slb_id)
  323. backend_servers = [
  324. {"ServerId": instance_id, "Weight": "0", "Type": "ecs", "ServerIp": ip_address}
  325. for instance_id, ip_address in instances_list]
  326. request.set_BackendServers(backend_servers)
  327. response = client.do_action_with_exception(request)
  328. return response
  329. except Exception as e:
  330. logging.error(e)
  331. sys.exit()
  332. def remove_backend_servers(client, slb_id, instances):
  333. """
  334. 服务器从负载均衡移除(一次调用最多可以移除20个后端服务器)
  335. :param client:
  336. :param slb_id:
  337. :param instances: 实例列表 [instance_id, ...]
  338. :return:
  339. """
  340. try:
  341. for i in range(len(instances) // 20 + 1):
  342. instances_list = instances[i * 20:(i + 1) * 20]
  343. if len(instances_list) == 0:
  344. return
  345. request = RemoveBackendServersRequest()
  346. request.set_accept_format('json')
  347. request.set_LoadBalancerId(slb_id)
  348. backend_servers = [
  349. {"ServerId": instance_id, "Weight": "0", "Type": "ecs"}
  350. for instance_id in instances_list]
  351. request.set_BackendServers(backend_servers)
  352. response = client.do_action_with_exception(request)
  353. return response
  354. except Exception as e:
  355. logging.error(e)
  356. sys.exit()
  357. def set_instance_weight_process_with_slbs(client, slb_id_list, instance_id_list, weight_list):
  358. """
  359. 修改服务器的权重值
  360. :param client: slb客户端连接
  361. :param slb_id_list: slb id list
  362. :param instance_id_list: instance id list
  363. :param weight_list: 权重修改列表 type-list [(weight, sleep_time), ...]
  364. :return:
  365. """
  366. for weight, sleep_time in weight_list:
  367. logging.info(f"修改权重中: weight = {weight}")
  368. for slb_id in slb_id_list:
  369. flag = True
  370. while flag:
  371. try:
  372. for i in range(len(instance_id_list) // 40 + 1):
  373. instances_list = instance_id_list[i * 40:(i + 1) * 40]
  374. if len(instances_list) == 0:
  375. break
  376. set_weight_for_instances(client=client, slb_id=slb_id, instance_id_list=instances_list, weight=weight)
  377. logging.info(f"slb: {slb_id} finished!")
  378. flag = False
  379. except Exception as e:
  380. time.sleep(10)
  381. continue
  382. time.sleep(sleep_time)
  383. def add_backend_servers_with_slbs(client, slb_id_list, instances):
  384. """
  385. 服务器挂载到负载均衡(必须是状态为运行中的后端服务器才可以加入负载均衡实例,每次调用最多可添加20个后端服务器)
  386. :param client:
  387. :param slb_id_list:
  388. :param instances: 实例列表 [(instance_id, ip), ...]
  389. :return:
  390. """
  391. try:
  392. for i in range(len(instances)//20 + 1):
  393. instances_list = instances[i*20:(i+1)*20]
  394. if len(instances_list) == 0:
  395. return
  396. for slb_id in slb_id_list:
  397. request = AddBackendServersRequest()
  398. request.set_accept_format('json')
  399. request.set_LoadBalancerId(slb_id)
  400. backend_servers = [
  401. {"ServerId": instance_id, "Weight": "0", "Type": "ecs", "ServerIp": ip_address}
  402. for instance_id, ip_address in instances_list]
  403. request.set_BackendServers(backend_servers)
  404. response = client.do_action_with_exception(request)
  405. logging.info(f"slb: {slb_id} add backend servers finished!")
  406. logging.info(f"i: {i}, count: {len(instances_list)}, instances: {instances_list} "
  407. f"add backend servers finished!")
  408. except Exception as e:
  409. logging.error(e)
  410. sys.exit()
  411. def remove_backend_servers_with_slbs(client, slb_id_list, instances):
  412. """
  413. 服务器从负载均衡移除(一次调用最多可以移除20个后端服务器)
  414. :param client:
  415. :param slb_id_list:
  416. :param instances: 实例列表 [instance_id, ...]
  417. :return:
  418. """
  419. try:
  420. for i in range(len(instances)//20 + 1):
  421. instances_list = instances[i*20:(i+1)*20]
  422. if len(instances_list) == 0:
  423. return
  424. for slb_id in slb_id_list:
  425. request = RemoveBackendServersRequest()
  426. request.set_accept_format('json')
  427. request.set_LoadBalancerId(slb_id)
  428. backend_servers = [
  429. {"ServerId": instance_id, "Weight": "0", "Type": "ecs"}
  430. for instance_id in instances_list]
  431. request.set_BackendServers(backend_servers)
  432. response = client.do_action_with_exception(request)
  433. logging.info(f"slb: {slb_id} remove backend servers finished!")
  434. logging.info(f"i: {i}, count: {len(instances_list)}, instances: {instances_list} "
  435. f"remove backend servers finished!")
  436. except Exception as e:
  437. logging.error(e)
  438. sys.exit()