#!/usr/bin/env python
# coding=utf-8
# ess-instance-rov-server.py
  3. import json
  4. import logging
  5. import time
  6. import requests
  7. import sys
  8. from aliyunsdkcore import client
  9. from aliyunsdkcore.client import AcsClient
  10. from aliyunsdkcore.acs_exception.exceptions import ClientException
  11. from aliyunsdkcore.acs_exception.exceptions import ServerException
  12. from aliyunsdkecs.request.v20140526.CreateInstanceRequest import CreateInstanceRequest
  13. from aliyunsdkecs.request.v20140526.StartInstanceRequest import StartInstanceRequest
  14. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  15. from aliyunsdkecs.request.v20140526.RunInstancesRequest import RunInstancesRequest
  16. from aliyunsdkecs.request.v20140526.DescribeNetworkInterfacesRequest import DescribeNetworkInterfacesRequest
  17. from aliyunsdkslb.request.v20140515.AddBackendServersRequest import AddBackendServersRequest
  18. from aliyunsdkecs.request.v20140526.RunCommandRequest import RunCommandRequest
  19. from aliyunsdkcore.request import CommonRequest
  20. logging.basicConfig(level=logging.INFO,
  21. format='%(asctime)s %(filename)s[line:%(lineno)d] %(levelname)s %(message)s',
  22. datefmt='%a, %d %b %Y %H:%M:%S')
  23. # ##### 购买服务器权限
  24. # access key Id
  25. ak_id = "LTAI4GBWbFvvXoXsSVBe1o9f"
  26. # access key secret
  27. ak_secret = "kRAikWitb4kDxaAyBqNrmLmllMEDO3"
  28. # 设置地域
  29. region_id = "cn-hangzhou"
  30. clt = client.AcsClient(ak_id, ak_secret, region_id)
  31. # 获取批量创建ECS实例的数量, 取值范围:1-100, 默认值:1
  32. amount = int(sys.argv[1])
  33. # 使用的镜像信息
  34. image_id = "m-bp1dnxi0r8zn5s0gpuwm"
  35. # 设置实例规格
  36. instance_type = "ecs.ic5.large"
  37. # 选择的交换机
  38. vswitch_id = "vsw-bp19lpjwtc6j0p0m9mdc2"
  39. # 当前VPC类型的安全组
  40. security_group_id = "sg-bp1irhrkr4vfj272hk4y"
  41. # 硬盘的大小,单位:G
  42. disk_size = "200"
  43. # 服务器命名
  44. instance_name = "ESS-rov-server-[1,2]"
  45. # 服务器所在区域
  46. zone_id = "cn-hangzhou-h"
  47. # 磁盘类型:云盘
  48. disk_category = "cloud_efficiency"
  49. # 密钥
  50. key_pair_name = "stuuudy"
  51. # 负载均衡ID
  52. slb_id_2 = "lb-bp1werfophtsjzfr76njm"
  53. # ##### 修改负载均衡权限
  54. AccessKey = 'LTAIuPbTPL3LDDKN'
  55. AccessSecret = 'ORcNedKwWuwVtcq4IRFtUDZgS0b1le'
  56. RegionId = 'cn-hangzhou'
  57. client = AcsClient(AccessKey, AccessSecret, RegionId)
  58. def build_request():
  59. """购买服务器参数配置"""
  60. request = RunInstancesRequest()
  61. request.set_ImageId(image_id)
  62. request.set_VSwitchId(vswitch_id)
  63. request.set_SecurityGroupId(security_group_id)
  64. request.set_ZoneId(zone_id)
  65. request.set_InstanceType(instance_type)
  66. # request.set_UserData(init_data)
  67. request.set_InstanceName(instance_name)
  68. request.set_SystemDiskSize(disk_size)
  69. request.set_SystemDiskCategory(disk_category)
  70. request.set_KeyPairName(key_pair_name)
  71. request.set_Tags([
  72. {
  73. "Key": "ecs",
  74. "Value": "rov-server.prod"
  75. }
  76. ])
  77. return request
  78. def _send_request(request):
  79. """发送API请求"""
  80. request.set_accept_format('json')
  81. try:
  82. response_str = clt.do_action_with_exception(request)
  83. logging.info(response_str)
  84. response_detail = json.loads(response_str)
  85. return response_detail
  86. except Exception as e:
  87. logging.error(e)
  88. def check_instance_running(instance_ids):
  89. """检查服务器运行状态"""
  90. request = DescribeInstancesRequest()
  91. request.set_InstanceIds(json.dumps(instance_ids))
  92. response = _send_request(request)
  93. if response.get('Code') is None:
  94. instances_list = response.get('Instances').get('Instance')
  95. running_count = 0
  96. for instance_detail in instances_list:
  97. if instance_detail.get('Status') == "Running":
  98. running_count += 1
  99. return running_count
  100. def runCommand(instance_ids):
  101. """批量执行shell脚本:启动服务"""
  102. request = RunCommandRequest()
  103. request.set_accept_format('json')
  104. request.set_Type("RunShellScript")
  105. request.set_CommandContent("sh /home/sh/rov-server-start.sh")
  106. request.set_InstanceIds(instance_ids)
  107. response = clt.do_action_with_exception(request)
  108. logging.info(response)
  109. def healthCheck(instance_id):
  110. """服务健康检查 & 服务器挂载到负载均衡"""
  111. ipaddr = getIpaddr(instance_id)
  112. while True:
  113. health_url = 'http://%s:5001/healthcheck' %(ipaddr)
  114. try:
  115. http_code = requests.get(health_url).status_code
  116. except:
  117. logging.info("images is downloading")
  118. http_code = 0
  119. if http_code == 200:
  120. break
  121. else:
  122. time.sleep(20)
  123. # 服务预热60s, 服务刚启动时CPU很高
  124. time.sleep(60)
  125. # 挂载到负载均衡
  126. addBackendServers(slb_id_2, instance_id)
  127. def setWeight(slb_id, instance_id, weight):
  128. """
  129. 设置slb权重
  130. :param slb_id: slb_id
  131. :param instance_id: 服务器id
  132. :param weight: 权重值
  133. :return: None
  134. """
  135. BackendServers = [{"ServerId": instance_id, "Weight": weight}]
  136. request = CommonRequest()
  137. request.set_accept_format('json')
  138. request.set_domain('slb.aliyuncs.com')
  139. request.set_version('2014-05-15')
  140. request.set_method('POST')
  141. request.set_action_name('SetBackendServers')
  142. request.add_query_param('BackendServers', BackendServers)
  143. request.add_query_param('LoadBalancerId', slb_id)
  144. try:
  145. response = client.do_action_with_exception(request)
  146. except Exception as e:
  147. logging.error(e)
  148. def addBackendServers(slb_id, instance_id):
  149. """服务器挂载到负载均衡"""
  150. request = AddBackendServersRequest()
  151. request.set_accept_format('json')
  152. ipaddr = getIpaddr(instance_id)
  153. request.set_LoadBalancerId(slb_id)
  154. request.set_BackendServers([{"ServerId": instance_id, "Weight": "0", "Type": "ecs", "ServerIp": ipaddr}])
  155. response = client.do_action_with_exception(request)
  156. logging.info(response)
  157. for i in range(1, 6):
  158. time.sleep(5)
  159. weight = i * 20
  160. logging.info(f"instance_id: {instance_id}, weight: {weight}")
  161. setWeight(slb_id=slb_id, instance_id=instance_id, weight=weight)
  162. def getIpaddr(instance_id):
  163. """根据 instance_id 获取实例IP地址"""
  164. request = DescribeNetworkInterfacesRequest()
  165. request.set_accept_format('json')
  166. request.set_InstanceId(instance_id)
  167. response = clt.do_action_with_exception(request)
  168. request_content = json.loads(response)
  169. ipaddr = request_content['NetworkInterfaceSets']['NetworkInterfaceSet'][0]['PrivateIpAddress']
  170. return ipaddr
  171. def _execute_request(request):
  172. response = _send_request(request)
  173. if response.get('Code') is None:
  174. instance_ids = response.get('InstanceIdSets').get('InstanceIdSet')
  175. running_amount = 0
  176. while running_amount < amount:
  177. time.sleep(10)
  178. running_amount = check_instance_running(instance_ids)
  179. logging.info(f"{instance_ids} is running")
  180. time.sleep(60)
  181. runCommand(instance_ids)
  182. for instance_id in instance_ids:
  183. healthCheck(instance_id)
  184. def create_multiple_instances():
  185. """创建ECS实例并启动"""
  186. request = build_request()
  187. request.set_Amount(amount)
  188. _execute_request(request)
  189. if __name__ == '__main__':
  190. logging.info("Start Create Instances")
  191. # 创建ECS实例并启动
  192. create_multiple_instances()