# app.py - Flask application that exposes Prometheus metrics endpoints.
  1. from flask import Flask,Response
  2. from DBSession import session_maker
  3. from model import *
  4. from sqlalchemy.sql import func
  5. from utils import *
  6. import atexit
  7. from aliyunsdkcore.client import AcsClient
  8. from aliyunsdkecs.request.v20140526.DescribeInstancesRequest import DescribeInstancesRequest
  9. from apscheduler.schedulers.background import BackgroundScheduler
  10. import json
  11. from model_longvideo import produce_video_task,produce_video_project
  12. from DBSession_longvideo import session_maker_longvideo
  13. from prometheus_client import Gauge,Counter, generate_latest
  14. from prometheus_client.core import CollectorRegistry
  15. from scheduler_jobs import interface_info_count
  16. from ex_response import ex_response
  17. import time
  18. import threading
  19. app = Flask(__name__)
  20. registry = CollectorRegistry(auto_describe=False)
  21. # 定义后台执行调度器
  22. scheduler = BackgroundScheduler()
  23. scheduler.add_job(func=update_request_url_list, trigger="interval", seconds=300)
  24. scheduler.start()
  25. atexit.register(lambda: scheduler.shutdown())
  26. client = AcsClient('LTAI4GBWbFvvXoXsSVBe1o9f', 'kRAikWitb4kDxaAyBqNrmLmllMEDO3', 'cn-hangzhou')
  27. healthcheck_status = Gauge("healthcheck_status", "ipaddress", ['instance_id','server_name', 'ipaddress'], registry=registry)
  28. url_http_avgtime = Gauge("url_http_times_avgs", "url of avgs", ['appType', 'url'], registry=registry)
  29. url_http_qps = Gauge("url_http_qps", "url of qps", ['appType','url'], registry=registry)
  30. url_http_expendtime_summary = Gauge("url_http_expendtime_summary", "expendtime summary", ['appType', 'url', 'duration'], registry=registry)
  31. url_http_error_code_cnt = Gauge("url_http_error_code_cnt", "error code", ['appType', 'error_code'], registry=registry)
  32. probe_http_status_code = Gauge("http_status_code", 'h5',['server_name'], registry=registry)
  33. probe_http_total_time = Gauge("http_total_time", 'h5',['server_name'], registry=registry)
  34. probe_http_dns_time = Gauge("http_dns_time", 'h5',['server_name'], registry=registry)
  35. probe_http_connect_time = Gauge("http_connect_time", 'h5',['server_name'], registry=registry)
  36. probe_http_pretransfer_time = Gauge("http_pretransfer_time", 'h5',['server_name'], registry=registry)
  37. probe_http_first_byte_time = Gauge("http_first_byte_time", 'h5',['server_name'], registry=registry)
  38. slb_http_status_code = Gauge("slb_http_status_code", 'slb', ['server_name', 'status'], registry=registry)
  39. #视频合成
  40. produce_video_task_count = Gauge("produce_video_task_count", 'status', ['status'], registry=registry)
  41. produce_video_task_rate = Gauge("produce_video_task_rate", 'produce_video_rate', ['produce_video_rate'], registry=registry)
  42. produce_video_task_ratio = Gauge("produce_video_task_ratio", 'produce_video_ratio', ['ratio'], registry=registry)
  43. produce_video_tts_count = Gauge("tts_aliyun_azure", 'success', ['tts_channel'], registry=registry)
  44. logs_app_recommend_log_cnt_300 = Gauge("logs_app_recommend_log_null_cnt_300", "null cnt", ['cnt'], registry=registry)
  45. logs_app_recommend_log_cnt_all = Counter("logs_app_recommend_log_null_cnt_all", "all cnt", ['cnt'], registry=registry)
  46. @app.route('/update')
  47. def update():
  48. request = DescribeInstancesRequest()
  49. request.set_accept_format('json')
  50. request.set_PageSize(100)
  51. # request.set_InstanceNetworkType("vpc")
  52. request.set_Tags([
  53. {
  54. "Key": "ecs"
  55. }
  56. ])
  57. response = client.do_action_with_exception(request)
  58. instance_info = json.loads(response)
  59. intances_list_del()
  60. count = len(instance_info["Instances"]["Instance"])
  61. for i in range(len(instance_info["Instances"]["Instance"])):
  62. instance_id = instance_info["Instances"]["Instance"][i]["InstanceId"]
  63. if instance_info["Instances"]["Instance"][i]["InstanceNetworkType"] == "vpc":
  64. ipaddr = instance_info["Instances"]["Instance"][i]["VpcAttributes"]["PrivateIpAddress"]["IpAddress"][0]
  65. if instance_info["Instances"]["Instance"][i]["InstanceNetworkType"] == "classic":
  66. ipaddr = instance_info["Instances"]["Instance"][i]["InnerIpAddress"]["IpAddress"][0]
  67. server_name = instance_info["Instances"]["Instance"][i]["Tags"]["Tag"][0]["TagValue"]
  68. status = instance_info["Instances"]["Instance"][i]["Status"]
  69. instance_name = instance_info["Instances"]["Instance"][i]["HostName"]
  70. if status == "Running":
  71. status = 1
  72. instance_insert(instance_id, ipaddr, instance_name, server_name, status)
  73. return "更新完成"
  74. @app.route('/app/healthcheck/metrics')
  75. def app_healthcheck():
  76. threads = []
  77. with session_maker() as session:
  78. instance_infos = session.query(InstanceList).filter(InstanceList.server_name=="longvideoapi.prod").all()
  79. for index in range(len(instance_infos)):
  80. ipaddr = instance_infos[index].ipadd
  81. server_name = instance_infos[index].server_name
  82. http_code = healthcheck(ipaddr, server_name)
  83. instance_id = instance_infos[index].instance_id
  84. healthcheck_status.labels(instance_id, server_name, ipaddr).set(http_code)
  85. return Response(generate_latest(registry),mimetype="text/plain")
  86. @app.route('/app/qps/metrics')
  87. def qps_avgtime_count():
  88. threads = []
  89. with session_maker() as session:
  90. intface_infos = session.query(IntfaceList.interface_url).all()
  91. app_type = session.query(app_info.app_type).all()
  92. for i in range(len(intface_infos)):
  93. for index in range(len(app_type)):
  94. url = intface_infos[i].interface_url
  95. appType = app_type[index].app_type
  96. url_avgtime = count_avg_time(appType, url)
  97. url_qps = count_qps(appType, url)
  98. url_http_avgtime.labels(appType, url).set(url_avgtime)
  99. url_http_qps.labels(appType, url).set(url_qps)
  100. return Response(generate_latest(registry),mimetype="text/plain")
  101. @app.route('/h5/metrics')
  102. def h5_healthcheck():
  103. # curl_respon = ex_response(
  104. share_h5 = "share_h5"
  105. download_h5 = "download_h5"
  106. share_h5_url = "https://longvideoh5.piaoquantv.com/core/share?shareSource=customerMessage&fromAppType=0&qrAppType=0&versionCode=321&shareUid=12463024&shareMachineCode=weixin_openid_o0w175fPwp8yrtOGihYJhvnT9Ag4&h5WxrootPageSource=vlog-pages___category&videoId=2689415&isRecommendShare=1&h5ShareId=backend493cd67dd28f4ee395781d59881567211625976055926&shareDepth=0&state=#"
  107. download_h5_url = "https://longvideoh5.piaoquantv.com/dist_1_3_4/upload?accessToken=fe8914eb2e99d1fe8ddaa2f753f5ec613eb2dfbb&versionCode=323&galleryId=0&fileType=2&machineCode=weixin_openid_o0w175fPwp8yrtOGihYJhvnT9Ag4&platform=devtools&system=iOS%2010.0.1&appType=0&appId=wx89e7eb06478361d7&pageSource=vlog-pages%2Fwebview&loginUid=12463024&machineInfo=%7B%22sdkVersion%22%3A%222.4.1%22,%22brand%22%3A%22devtools%22,%22language%22%3A%22zh_CN%22,%22model%22%3A%22iPhone%20X%22,%22platform%22%3A%22devtools%22,%22system%22%3A%22iOS%2010.0.1%22,%22weChatVersion%22%3A%228.0.5%22,%22screenHeight%22%3A812,%22screenWidth%22%3A375,%22windowHeight%22%3A730,%22windowWidth%22%3A375,%22softVersion%22%3A%224.1.168%22%7D&wxHelpPagePath=%2Fpackage-my%2Fhelp-feedback%2Fhelp-feedback&transaction=2065ff98-6f27-4f09-c9eb-d366c99dd5d5&videoBarrageSwitch=true&addMusic=1&eventId=0&fromActivityId=0&sessionId=1626833289618-583a312d-81cd-62f9-cdd4-cf914c682d55&subSessionId=1626833289618-583a312d-81cd-62f9-cdd4-cf914c682d55&projectId=&entranceType=#wechat_redirec"
  108. shar_h5_curl_response = ex_response(share_h5_url)
  109. share_h5_url_info = shar_h5_curl_response.getinfo()
  110. download_h5_curl_response = ex_response(download_h5_url)
  111. download_h5_url_info = download_h5_curl_response.getinfo()
  112. probe_http_status_code.labels(share_h5).set(share_h5_url_info["http_code"])
  113. probe_http_status_code.labels(download_h5).set(download_h5_url_info["http_code"])
  114. probe_http_total_time.labels("share_h5").set(share_h5_url_info["total_time"]*1000)
  115. probe_http_total_time.labels("download_h5").set(download_h5_url_info["total_time"]*1000)
  116. probe_http_dns_time.labels("share_h5").set(share_h5_url_info["dns_time"]*1000)
  117. probe_http_dns_time.labels("download_h5").set(download_h5_url_info["dns_time"]*1000)
  118. probe_http_connect_time.labels("share_h5").set(share_h5_url_info["dns_time"]*1000)
  119. probe_http_connect_time.labels("download_h5").set(download_h5_url_info["dns_time"]*1000)
  120. probe_http_pretransfer_time.labels("share_h5").set(share_h5_url_info["pretransfer_time"]*1000)
  121. probe_http_pretransfer_time.labels("download_h5").set(download_h5_url_info["pretransfer_time"]*1000)
  122. probe_http_first_byte_time.labels("share_h5").set(share_h5_url_info["first_byte_time"]*1000)
  123. probe_http_first_byte_time.labels("download_h5").set(download_h5_url_info["first_byte_time"]*1000)
  124. return Response(generate_latest(registry), mimetype="text/plain")
  125. @app.route('/slbStatusCode/metrics')
  126. def slb_request_status_metric():
  127. svc_name = {'longvideoapi', 'clip', 'speed'}
  128. for name in svc_name:
  129. res = slb_status_code_count(name)
  130. if res:
  131. for i in range(len(res)):
  132. status = res[i]['status']
  133. cnt = float(res[i]['cnt'])
  134. slb_http_status_code.labels(name, status).set(cnt)
  135. return Response(generate_latest(registry), mimetype="text/plain")
  136. @app.route('/metrics')
  137. def all_metric():
  138. """视频合成类metrics"""
  139. """视频合成成功率"""
  140. start_time = int(time.strftime("%Y%m%d%H%M", time.localtime())) * 100000000000
  141. end_time = (int(time.strftime("%Y%m%d%H%M", time.localtime())) + 5) * 100000000000
  142. print(start_time, end_time)
  143. query_sql = ("select round((successCount + processingCount1)/totalCount * 100,2) from "
  144. "(select count(*) as totalCount,"
  145. "sum(case when produce_status in (5,6,7,8) then 1 else 0 end) as successCount,"
  146. "sum(case when produce_status = 99 then 1 else 0 end) as failCount , "
  147. "sum(case when produce_status in(0,1,2,3,4) then 1 else 0 end) as processingCount,"
  148. "sum(case when produce_status in(0,1,2,3,4) and (rate < 1 or rate is null) then 1 else 0 end) processingCount1,"
  149. "sum(case when produce_status in(0,1,2,3,4) and rate >= 1 then 1 else 0 end) processingCount2 from "
  150. "(select t1.project_id, t1.produce_status, round((t2.last_connect_timestamp - t1.submit_timestamp) / (t1.video_duration/1000), 1) as rate from produce_video_project t1 "
  151. "left join produce_video_project_connect_time t2 on t1.project_id = t2.project_id "
  152. "where t1.project_id > %s and t1.project_id < %s and t1.app_type not in (1,13,15)) s1) ss1" %(start_time ,end_time)
  153. )
  154. res = db_query(query_sql)
  155. if res[0] is not None:
  156. produce_video_task_rate.labels("produce_video_task_rate").set(res[0])
  157. else:
  158. produce_video_task_rate.labels("produce_video_task_rate").set(-1)
  159. """今日视频合成任务数"""
  160. """今日视频合成成功数量"""
  161. """今日视频合成失败数量"""
  162. """视频合成中任务数量"""
  163. res = produce_video_task_cnt()
  164. if res:
  165. if res[0]:
  166. total_cnt = res[0]
  167. produce_video_task_count.labels("total").set(total_cnt)
  168. if res[1]:
  169. success_cnt = res[1]
  170. produce_video_task_count.labels("success").set(success_cnt)
  171. if res[2]:
  172. fail_cnt = res[2]
  173. produce_video_task_count.labels("fail").set(fail_cnt)
  174. if res[3]:
  175. process_cnt = res[3]
  176. produce_video_task_count.labels("process").set(process_cnt)
  177. if res[4]:
  178. r1 = res[4]
  179. produce_video_task_ratio.labels("<0.5").set(r1)
  180. if res[5]:
  181. r2 = res[5]
  182. produce_video_task_ratio.labels("0.5-0.7").set(r2)
  183. if res[5]:
  184. r3 = res[6]
  185. produce_video_task_ratio.labels("0.7-1.0").set(r3)
  186. if res[5]:
  187. r4 = res[7]
  188. produce_video_task_ratio.labels("1.0-1.5").set(r4)
  189. if res[5]:
  190. r5 = res[8]
  191. produce_video_task_ratio.labels("1.5-2.0").set(r5)
  192. if res[5]:
  193. r6 = res[9]
  194. produce_video_task_ratio.labels(">2.0").set(r6)
  195. # sql = "select v1 as 平均合成耗时,v2 as 平均视频时长, round(v2/v1,1) as 时长耗时比 from (select avg(produce_done_timestamp - submit_timestamp) as v1, avg(video_duration/1000) as v2 from produce_video_project where project_id > {} and project_id < {} and app_type not in (13,15) and produce_status in (5,6,7,8)) as t1".format(start_time, end_time)
  196. # #tts
  197. # res = db_query(sql)
  198. # if res[2] is not None:
  199. # produce_video_task_count.labels("video_progress").set(res[2])
  200. # else:
  201. # produce_video_task_count.labels("video_progress").set(0)
  202. res = logs_tts_count("aliyun",1)
  203. if res is not None:
  204. produce_video_tts_count.labels("aliyun_success").set(res[0]["count"])
  205. else:
  206. produce_video_tts_count.labels("aliyun_success").set(0)
  207. res = logs_tts_count("aliyun", 0)
  208. if res is not None:
  209. produce_video_tts_count.labels("aliyun_fail").set(res[0]["count"])
  210. else:
  211. produce_video_tts_count.labels("aliyun_fail").set(0)
  212. res = logs_tts_count("azure", 1)
  213. if res is not None:
  214. produce_video_tts_count.labels("azure_success").set(res[0]["count"])
  215. else:
  216. produce_video_tts_count.labels("azure_success").set(0)
  217. res = logs_tts_count("aliyun", 0)
  218. if res is not None:
  219. produce_video_tts_count.labels("azure_fail").set(res[0]["count"])
  220. else:
  221. produce_video_tts_count.labels("azure_fail").set(0)
  222. #当日负载均衡http_code
  223. svc_name = {'longvideoapi', 'clip', 'speed', 'commonapi'}
  224. for name in svc_name:
  225. res = slb_status_code_count(name)
  226. if res:
  227. for i in range(len(res)):
  228. status = res[i]['status']
  229. cnt = float(res[i]['cnt'])
  230. slb_http_status_code.labels(name, status).set(cnt)
  231. #h5 healthcheck
  232. share_h5 = "share_h5"
  233. download_h5 = "download_h5"
  234. share_h5_url = "https://longvideoh5.piaoquantv.com/core/share?shareSource=customerMessage&fromAppType=0&qrAppType=0&versionCode=321&shareUid=12463024&shareMachineCode=weixin_openid_o0w175fPwp8yrtOGihYJhvnT9Ag4&h5WxrootPageSource=vlog-pages___category&videoId=2689415&isRecommendShare=1&h5ShareId=backend493cd67dd28f4ee395781d59881567211625976055926&shareDepth=0&state=#"
  235. download_h5_url = "https://longvideoh5.piaoquantv.com/dist_1_3_4/upload?accessToken=fe8914eb2e99d1fe8ddaa2f753f5ec613eb2dfbb&versionCode=323&galleryId=0&fileType=2&machineCode=weixin_openid_o0w175fPwp8yrtOGihYJhvnT9Ag4&platform=devtools&system=iOS%2010.0.1&appType=0&appId=wx89e7eb06478361d7&pageSource=vlog-pages%2Fwebview&loginUid=12463024&machineInfo=%7B%22sdkVersion%22%3A%222.4.1%22,%22brand%22%3A%22devtools%22,%22language%22%3A%22zh_CN%22,%22model%22%3A%22iPhone%20X%22,%22platform%22%3A%22devtools%22,%22system%22%3A%22iOS%2010.0.1%22,%22weChatVersion%22%3A%228.0.5%22,%22screenHeight%22%3A812,%22screenWidth%22%3A375,%22windowHeight%22%3A730,%22windowWidth%22%3A375,%22softVersion%22%3A%224.1.168%22%7D&wxHelpPagePath=%2Fpackage-my%2Fhelp-feedback%2Fhelp-feedback&transaction=2065ff98-6f27-4f09-c9eb-d366c99dd5d5&videoBarrageSwitch=true&addMusic=1&eventId=0&fromActivityId=0&sessionId=1626833289618-583a312d-81cd-62f9-cdd4-cf914c682d55&subSessionId=1626833289618-583a312d-81cd-62f9-cdd4-cf914c682d55&projectId=&entranceType=#wechat_redirec"
  236. shar_h5_curl_response = ex_response(share_h5_url)
  237. share_h5_url_info = shar_h5_curl_response.getinfo()
  238. download_h5_curl_response = ex_response(download_h5_url)
  239. download_h5_url_info = download_h5_curl_response.getinfo()
  240. probe_http_status_code.labels(share_h5).set(share_h5_url_info["http_code"])
  241. probe_http_status_code.labels(download_h5).set(download_h5_url_info["http_code"])
  242. probe_http_total_time.labels("share_h5").set(share_h5_url_info["total_time"]*1000)
  243. probe_http_total_time.labels("download_h5").set(download_h5_url_info["total_time"]*1000)
  244. probe_http_dns_time.labels("share_h5").set(share_h5_url_info["dns_time"]*1000)
  245. probe_http_dns_time.labels("download_h5").set(download_h5_url_info["dns_time"]*1000)
  246. probe_http_connect_time.labels("share_h5").set(share_h5_url_info["dns_time"]*1000)
  247. probe_http_connect_time.labels("download_h5").set(download_h5_url_info["dns_time"]*1000)
  248. probe_http_pretransfer_time.labels("share_h5").set(share_h5_url_info["pretransfer_time"]*1000)
  249. probe_http_pretransfer_time.labels("download_h5").set(download_h5_url_info["pretransfer_time"]*1000)
  250. probe_http_first_byte_time.labels("share_h5").set(share_h5_url_info["first_byte_time"]*1000)
  251. probe_http_first_byte_time.labels("download_h5").set(download_h5_url_info["first_byte_time"]*1000)
  252. #推荐业务
  253. res_null_cnt = count_recommend_null()
  254. logs_app_recommend_log_cnt_300.labels("recommend").set(res_null_cnt)
  255. # # logs_app_recommend_log_cnt_all.labels("recommend").inc(1)
  256. # logs_app_recommend_log_cnt_all.inc(res_null_cnt)
  257. return Response(generate_latest(registry), mimetype="text/plain")
  258. @app.route('/qps_avgtime/metrics')
  259. def qps_avgtime_metrics():
  260. """统计接口QPM, RT时间,RT时间分布 """
  261. res, url = app_openapi_qps_avgtime_count()
  262. qps = int(res.body[0]["cnt"])
  263. avgtime = int(float(res.body[0]["avg_time"]))
  264. app_type_temp = 1
  265. url_http_qps.labels(app_type_temp, url).set(qps)
  266. url_http_avgtime.labels(app_type_temp, url).set(avgtime)
  267. app_type = ['1', '0', '4', '5', '6', '12', '13', '15']
  268. for i in range(len(app_type)):
  269. appType = app_type[i]
  270. res = count_qps_avgtime(appType)
  271. for i in range(len(res.body)):
  272. url = res.body[i]["requestUri"]
  273. qps = int(res.body[i]["cnt"])
  274. avgtime = int(float(res.body[i]["avg_time"]))
  275. url_http_qps.labels(appType, url).set(qps)
  276. url_http_avgtime.labels(appType, url).set(avgtime)
  277. res = count_rt_less_time_count(appType, 0, 200)
  278. for i in range(len(res.body)):
  279. url = res.body[i]["requestUri"]
  280. count = res.body[i]["cnt"]
  281. url_http_expendtime_summary.labels(appType, url, "0-200").set(count)
  282. res = count_rt_less_time_count(appType, 200, 500)
  283. for i in range(len(res.body)):
  284. url = res.body[i]["requestUri"]
  285. count = res.body[i]["cnt"]
  286. url_http_expendtime_summary.labels(appType, url, "200-300").set(count)
  287. res = count_rt_less_time_count(appType, 500, 1000)
  288. for i in range(len(res.body)):
  289. url = res.body[i]["requestUri"]
  290. count = res.body[i]["cnt"]
  291. url_http_expendtime_summary.labels(appType, url, "500-1000").set(count)
  292. res = count_rt_less_time_count(appType, 1000, 10000)
  293. for i in range(len(res.body)):
  294. url = res.body[i]["requestUri"]
  295. count = res.body[i]["cnt"]
  296. url_http_expendtime_summary.labels(appType, url, ">1000").set(count)
  297. """接口error统计"""
  298. res = error_cnt(appType)
  299. for i in range(len(res.body)):
  300. cnt = res.body[i]["cnt"]
  301. error_code = res.body[i]["resultCode"]
  302. url_http_error_code_cnt.labels(appType,error_code).set(cnt)
  303. return Response(generate_latest(registry), mimetype="text/plain")
  304. def produce_video_data():
  305. start_time = (int(time.strftime("%Y%m%d%H%M", time.localtime())) - 30) * 100000000000
  306. end_time = (int(time.strftime("%Y%m%d%H%M", time.localtime()))) * 100000000000
  307. sum_sql = ("select count(*) as totalCount from"
  308. "(select t1.project_id, t1.produce_status "
  309. "from produce_video_project t1 "
  310. "left join produce_video_project_connect_time t2 on t1.project_id = t2.project_id "
  311. " where t1.project_id > %s and t1.project_id < %s and t1.app_type not in (1,13,15)) s1) ss1"%(start_time,end_time)
  312. )
  313. if __name__ == '__main__':
  314. app.run()
  315. # app.run(host='192.168.201.1', port=9091)