#!/bin/bash
# process_offline.sh - watchdog for the offline crawlers.
#
# Usage: process_offline.sh <env>
#   env  "dev" selects the developer-machine paths; any other value
#        (normally "prod") selects the production paths. The value is also
#        forwarded unchanged to the crawlers as their --env argument.
#
# On every run the script:
#   1. sources the environment profile from the home directory;
#   2. starts Appium if it is not already running;
#   3. finds the crawler whose time window contains the current time, kills
#      the other five crawlers and starts the selected one if it is down;
#   4. deletes *.log files in main/main_logs/ not modified for over 10 days.
#
# NOTE(review): presumably invoked periodically by a scheduler - confirm.

env=${1:-} # runtime environment: "prod" (production) or "dev" (test)

if [[ "${env}" == "dev" ]]; then
  piaoquan_crawler_dir=/Users/wangkun/Desktop/crawler/piaoquan_crawler/
  profile_path=/etc/profile
  node_path=/opt/homebrew/bin/node
else
  piaoquan_crawler_dir=/Users/piaoquan/Desktop/piaoquan_crawler/
  # Relative path: resolved against the home directory, see "cd ~" below.
  profile_path=./base_profile
  node_path=/usr/local/bin/node
fi
log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
appium_main=/Applications/Appium.app/Contents/Resources/app/node_modules/appium/build/lib/main.js

# Wall-clock time sampled once so that every window test below sees the same
# instant and exactly one window can match.
now=$(date +%H:%M:%S)

# Appends one timestamped line to the daily process log.
# Arguments: $* - message text
write_log() {
  printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "$*" >> "${log_path}"
}

# Succeeds when start <= now < end (zero-padded HH:MM:SS strings, compared
# lexicographically). The windows are half-open so that consecutive windows
# tile the day without gaps; with strict comparisons on both ends a run that
# started at e.g. exactly 01:00:00 matched no window at all.
# Arguments: $1 - inclusive start, $2 - exclusive end
in_window() {
  ! [[ "${now}" < "$1" ]] && [[ "${now}" < "$2" ]]
}

# Succeeds when some process has a command line matching the pattern.
# Arguments: $1 - pattern handed to pgrep -f
process_running() {
  pgrep -f "$1" > /dev/null
}

# Kills (SIGKILL) every crawler except the one owning the current window.
# Arguments: $1 - process-name key of the crawler to spare
stop_other_crawlers() {
  local keep=$1
  local key
  for key in run_zhiqingtiantiankan run_htzf run_ganggangdouchuan \
    run_jixiangxingfu run_zhongmiaoyinxin run_zfqz; do
    if [[ "${key}" != "${keep}" ]]; then
      # pkill exits non-zero when nothing matched; that is not an error here.
      pkill -9 -f "${key}"
    fi
  done
}

# Changes into the crawler project root; logs and fails when that is not
# possible, so callers never launch a crawler from the wrong directory.
enter_crawler_dir() {
  cd "${piaoquan_crawler_dir}" && return 0
  write_log "无法进入目录 ${piaoquan_crawler_dir}, 取消启动!"
  return 1
}

# Launches a "recommend" crawler in the background from the project root,
# appending its output to <crawler>/logs/nohup-recommend.log.
# Arguments: $1 - crawler directory name (also passed as --crawler)
#            $2 - entry script file name inside <crawler>/<crawler>_main/
# Returns:   non-zero only when the project root cannot be entered
start_recommend_crawler() {
  local crawler=$1
  local script=$2
  enter_crawler_dir || return 1
  nohup python3 -u "${crawler}/${crawler}_main/${script}" \
    --log_type="recommend" --crawler="${crawler}" --env="${env}" \
    >> "${crawler}/logs/nohup-recommend.log" 2>&1 &
}

# ********** refresh environment ********** #
write_log "更新环境变量..."
cd ~ && source "${profile_path}"
write_log "更新环境变量完成!"

# ********** Appium ********** #
write_log "正在重启Appium..."
if process_running "${appium_main}"; then
  write_log "Appium 进程状态正常"
else
  write_log "Appium异常停止,正在重启!"
  # Output goes to nohup.log in the current directory (home, after "cd ~").
  nohup "${node_path}" "${appium_main}" >> ./nohup.log 2>&1 &
  write_log "重启Appium完毕!"
fi

# ********** zhiqingtiantiankan: 00:00 - 01:00 ********** #
if in_window "00:00:00" "01:00:00"; then
  write_log "开始启动 知青天天看 爬虫脚本任务"
  stop_other_crawlers run_zhiqingtiantiankan
  if process_running "run_zhiqingtiantiankan_recommend.py"; then
    write_log "知青天天看小程序爬虫, 进程状态正常"
  else
    write_log "知青天天看小程序爬虫, 异常停止, 正在重启!"
    if start_recommend_crawler zhiqingtiantiankan run_zhiqingtiantiankan_recommend.py; then
      write_log "重启完成!"
    fi
  fi
else
  write_log "知青天天看 爬虫脚本任务结束"
fi

# ********** haitunzhufu: 01:00 - 04:00 ********** #
if in_window "01:00:00" "04:00:00"; then
  write_log "开始启动 海豚祝福 爬虫脚本任务"
  stop_other_crawlers run_htzf
  if process_running "run_htzf_recommend.py"; then
    write_log "海豚祝福小程序爬虫, 进程状态正常"
  else
    write_log "海豚祝福小程序爬虫, 异常停止, 正在重启!"
    if start_recommend_crawler haitunzhufu run_htzf_recommend.py; then
      write_log "重启完成!"
    fi
  fi
else
  write_log "海豚祝福 爬虫脚本任务结束"
fi

# ********** ganggangdouchuan: 04:00 - 07:00 ********** #
if in_window "04:00:00" "07:00:00"; then
  write_log "开始启动 刚刚都传 爬虫脚本任务"
  stop_other_crawlers run_ganggangdouchuan
  if process_running "run_ganggangdouchuan_recommend.py"; then
    write_log "刚刚都传小程序爬虫, 进程状态正常"
  else
    write_log "刚刚都传小程序爬虫, 异常停止, 正在重启!"
    if start_recommend_crawler ganggangdouchuan run_ganggangdouchuan_recommend.py; then
      write_log "重启完成!"
    fi
  fi
else
  write_log "刚刚都传小程序爬虫, 任务结束"
fi

# ********** jixiangxingfu: 07:00 - 10:00 ********** #
if in_window "07:00:00" "10:00:00"; then
  write_log "开始启动 吉祥幸福 爬虫脚本任务"
  stop_other_crawlers run_jixiangxingfu
  if process_running "run_jixiangxingfu_recommend.py"; then
    write_log "吉祥幸福 进程状态正常"
  else
    write_log "吉祥幸福爬虫, 异常停止, 正在重启!"
    if start_recommend_crawler jixiangxingfu run_jixiangxingfu_recommend.py; then
      write_log "重启完成!"
    fi
  fi
else
  write_log "吉祥幸福 爬虫脚本任务结束"
fi

# ********** zhongmiaoyinxin: 10:00 - 13:00 ********** #
if in_window "10:00:00" "13:00:00"; then
  write_log "开始启动 众妙音信 爬虫脚本任务"
  stop_other_crawlers run_zhongmiaoyinxin
  if process_running "run_zhongmiaoyinxin_recommend.py"; then
    write_log "众妙音信小程序爬虫, 进程状态正常"
  else
    write_log "众妙音信小程序爬虫, 异常停止, 正在重启!"
    if start_recommend_crawler zhongmiaoyinxin run_zhongmiaoyinxin_recommend.py; then
      write_log "重启完成!"
    fi
  fi
else
  write_log "众妙音信 爬虫脚本任务结束"
fi

# ********** zhufuquanzi: 13:00 - 24:00 ********** #
if in_window "13:00:00" "24:00:00"; then
  write_log "开始启动 祝福圈子 爬虫脚本任务"
  stop_other_crawlers run_zfqz
  if process_running "run_zfqz_recommend.py"; then
    write_log "祝福圈子小程序爬虫, 进程状态正常"
  else
    write_log "祝福圈子小程序爬虫, 异常停止, 正在重启!"
    if enter_crawler_dir; then
      # Unlike the other crawlers this one is started through process_mq.sh,
      # which runs in the foreground here.
      /bin/sh "${piaoquan_crawler_dir}main/process_mq.sh" \
        "zfqz" "zhufuquanzi" "recommend" "${env}"
      write_log "重启完成!"
    fi
  fi
else
  write_log "祝福圈子 爬虫脚本任务结束"
fi

# ********** log cleanup ********** #
write_log "开始清理 10 天前的日志文件"
find "${piaoquan_crawler_dir}main/main_logs/" -mtime +10 -name "*.log" \
  -exec rm -rf -- {} +
write_log "日志文件清理完毕"
exit 0