#!/bin/bash
# process_offline.sh - supervisor for the offline crawlers.
#
# Usage: process_offline.sh <env>
#   env  crawler runtime environment. "dev" selects the developer-machine
#        paths; any other value (normally "prod", also an empty value)
#        selects the production paths. The value is forwarded unchanged to
#        every crawler as --env.
#
# One run performs these steps, appending progress lines to the daily log
# ${piaoquan_crawler_dir}main/main_logs/process-YYYY-MM-DD.log:
#   1. source the environment profile from the home directory;
#   2. start Appium when no Appium process is found;
#   3. for every crawler: if the time captured at start-up lies inside one
#      of the crawler's windows, kill the other listed crawlers and start
#      this one unless it is already running; otherwise only log that its
#      task has ended (nothing is stopped in that branch);
#   4. delete *.log entries older than 10 days from the main log directory.
#
# The script always exits 0. Strict mode (set -e / -u) is deliberately not
# enabled: the sourced profile is outside this script's control and every
# step is best-effort.
# NOTE(review): presumably scheduled periodically (e.g. from cron) - confirm.

env=$1
if [[ "${env}" == "dev" ]]; then
  piaoquan_crawler_dir=/Users/wangkun/Desktop/crawler/piaoquan_crawler/
  profile_path=/etc/profile
  node_path=/opt/homebrew/bin/node
else
  piaoquan_crawler_dir=/Users/piaoquan/Desktop/piaoquan_crawler/
  profile_path=./base_profile
  node_path=/usr/local/bin/node
fi
log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
appium_main=/Applications/Appium.app/Contents/Resources/app/node_modules/appium/build/lib/main.js

# Captured once so that every window check below sees the same instant.
now=$(date +%H:%M:%S)

#######################################
# Append one timestamped line to the daily process log.
# Globals:   log_path (read)
# Arguments: the message words
#######################################
log_msg() {
  printf '%s %s\n' "$(date '+%Y-%m-%d %H:%M:%S')" "$*" >> "${log_path}"
}

#######################################
# Tell whether a time lies inside any of the given windows.
# Both bounds are inclusive, so a run stamped exactly on a boundary second
# (for example 02:00:00) still belongs to a window. Values are compared as
# strings, which orders zero-padded HH:MM:SS correctly.
# Arguments: $1   - time as HH:MM:SS
#            $2.. - windows written as START-END
# Returns:   0 if inside at least one window, 1 otherwise
#######################################
in_window() {
  local current=$1 span start end
  shift
  for span in "$@"; do
    start=${span%-*}
    end=${span#*-}
    if [[ ! "${current}" < "${start}" && ! "${current}" > "${end}" ]]; then
      return 0
    fi
  done
  return 1
}

#######################################
# Tell whether no process matches a command-line pattern.
# Only pgrep's "no match" status (1) counts as stopped; any other failure
# is treated as "not stopped" so that nothing is started twice by mistake.
# Arguments: $1 - pattern matched against full command lines (pgrep -f)
# Returns:   0 if no process matched, non-zero otherwise
#######################################
process_stopped() {
  local status=0
  pgrep -f "$1" > /dev/null 2>&1 || status=$?
  ((status == 1))
}

#######################################
# Send SIGKILL to every process whose command line matches a pattern.
# A pattern without matches is not an error.
# Arguments: one or more patterns (pkill -f)
#######################################
kill_crawlers() {
  local pattern
  for pattern in "$@"; do
    pkill -9 -f "${pattern}"
  done
}

#######################################
# Launch one crawler in the background from the crawler directory.
# Globals:   piaoquan_crawler_dir, env (read)
# Arguments: $1 - python interpreter
#            $2 - crawler script, relative to piaoquan_crawler_dir
#            $3 - value passed as --crawler
#            $4 - nohup log file, relative to piaoquan_crawler_dir
# Returns:   1 if the crawler directory cannot be entered (nothing is
#            launched and no completion line is logged), 0 otherwise
#######################################
start_crawler() {
  local python_bin=$1 script=$2 crawler=$3 nohup_log=$4
  adb forward --remove-all
  # The script and log paths are relative, so a failed cd must abort.
  cd "${piaoquan_crawler_dir}" || return 1
  nohup "${python_bin}" -u "${script}" --log_type="recommend" \
    --crawler="${crawler}" --env="${env}" >> "${nohup_log}" 2>&1 &
  log_msg "重启完成!"
}

# Refresh environment variables. Sourced at top level (not inside a
# function) so that declarations made by the profile keep global scope.
log_msg "更新环境变量..."
# shellcheck source=/dev/null
cd ~ && source "${profile_path}"
log_msg "更新环境变量完成!"

# Appium: start it when no process is found. The nohup log path is relative
# to the current directory at this point.
log_msg "正在重启Appium..."
if process_stopped "${appium_main}"; then
  log_msg "Appium异常停止,正在重启!"
  nohup "${node_path}" "${appium_main}" >> ./nohup.log 2>&1 &
  log_msg "重启Appium完毕!"
else
  log_msg "Appium 进程状态正常"
fi

# NOTE(review): the kill lists below differ per crawler (for example only
# two of them kill run_ppq). They are kept exactly as they were; confirm
# whether the differences are intentional.

# Jixiangxingfu crawler.
if in_window "${now}" 00:30:00-01:59:59 05:00:00-05:59:59; then
  log_msg "开始启动 吉祥幸福 爬虫脚本任务"
  kill_crawlers run_zfqz run_zmyx run_xngplus run_xngrule
  if process_stopped "run_jixiangxingfu_recommend.py"; then
    log_msg "吉祥幸福爬虫, 异常停止, 正在重启!"
    start_crawler python3 \
      jixiangxingfu/jixiangxingfu_main/run_jixiangxingfu_recommend.py \
      jixiangxingfu jixiangxingfu/logs/nohup-recommend.log
  else
    log_msg "吉祥幸福 进程状态正常"
  fi
else
  log_msg "吉祥幸福 爬虫脚本任务结束"
fi

# Zhongmiaoyinxin (new) crawler.
if in_window "${now}" 02:00:00-03:59:59 06:00:00-06:59:59; then
  log_msg "开始启动 众妙音信-new 爬虫脚本任务"
  kill_crawlers run_jixiangxingfu run_zfqz run_xngplus run_xngrule
  if process_stopped "run_zmyx_recommend.py"; then
    log_msg "众妙音信-new小程序爬虫, 异常停止, 正在重启!"
    start_crawler python3 \
      zhongmiaoyinxin/zhongmiaoyinxin_main/run_zmyx_recommend.py \
      zhongmiaoyinxin zhongmiaoyinxin/logs/nohup-recommend.log
  else
    log_msg "众妙音信-new小程序爬虫, 进程状态正常"
  fi
else
  log_msg "众妙音信 爬虫脚本任务结束"
fi

# Xiaoniangao "rule" crawler. It shares the xiaoniangaoplus directory,
# --crawler value and nohup log with the Xiaoniangao "plus" crawler.
if in_window "${now}" 21:00:00-21:59:59; then
  log_msg "开始启动 小年糕-rule 爬虫脚本任务"
  kill_crawlers run_zmyx run_xngplus
  if process_stopped "run_xngrule_recommend.py"; then
    log_msg "小年糕-rule 小程序爬虫, 异常停止, 正在重启!"
    start_crawler python3 \
      xiaoniangaoplus/xiaoniangaoplus_main/run_xngrule_recommend.py \
      xiaoniangaoplus xiaoniangaoplus/logs/nohup-recommend.log
  else
    log_msg "小年糕-rule 程序爬虫, 进程状态正常"
  fi
else
  log_msg "小年糕-rule 爬虫脚本任务结束"
fi

# Xiaoniangao "plus" crawler.
# NOTE(review): this is the only crawler launched with python3.10 instead
# of python3 - confirm that the difference is intentional.
if in_window "${now}" 07:00:00-08:59:59 19:00:00-20:59:59 \
  13:00:00-14:59:59 17:00:00-17:59:59; then
  log_msg "开始启动 小年糕+ 爬虫脚本任务"
  kill_crawlers run_xngrule run_zfqz run_zmyx run_jixiangxingfu run_ppq
  if process_stopped "run_xngplus_recommend.py"; then
    log_msg "小年糕+ 小程序爬虫, 异常停止, 正在重启!"
    start_crawler python3.10 \
      xiaoniangaoplus/xiaoniangaoplus_main/run_xngplus_recommend.py \
      xiaoniangaoplus xiaoniangaoplus/logs/nohup-recommend.log
  else
    log_msg "小年糕+ 程序爬虫, 进程状态正常"
  fi
else
  log_msg "小年糕+ 爬虫脚本任务结束"
fi

# Zhufuquanzi crawler.
if in_window "${now}" 10:00:00-11:59:59 15:00:00-15:59:59; then
  log_msg "开始启动 祝福圈子 爬虫脚本任务"
  kill_crawlers run_xngplus run_xngrule run_jixiangxingfu run_zmyx
  if process_stopped "run_zfqz_recommend.py"; then
    log_msg "祝福圈子 小程序爬虫, 异常停止, 正在重启!"
    start_crawler python3 \
      zhufuquanzi/zhufuquanzi_main/run_zfqz_recommend.py \
      zhufuquanzi zhufuquanzi/logs/nohup-recommend.log
  else
    log_msg "祝福圈子 程序爬虫, 进程状态正常"
  fi
else
  log_msg "祝福圈子 爬虫脚本任务结束"
fi

# Piaopiaoquan crawler.
# NOTE(review): --crawler is "zhufuquanzi" although the script and log live
# under piaopiaoquan/. This looks like a copy-paste slip but is kept as-is
# because the crawler's handling of the value is not visible here - confirm.
if in_window "${now}" 16:00:00-16:59:59; then
  log_msg "开始启动 漂漂圈 爬虫脚本任务"
  kill_crawlers run_xngplus run_xngrule run_jixiangxingfu run_zmyx run_zfqz
  if process_stopped "run_ppq_recommend.py"; then
    log_msg "漂漂圈 小程序爬虫, 异常停止, 正在重启!"
    start_crawler python3 \
      piaopiaoquan/piaopiaoquan_main/run_ppq_recommend.py \
      zhufuquanzi piaopiaoquan/logs/nohup-recommend.log
  else
    log_msg "漂漂圈 程序爬虫, 进程状态正常"
  fi
else
  log_msg "漂漂圈 爬虫脚本任务结束"
fi

# A block that was already disabled used to sit here: during 13:00:00-13:59:59,
# 16:00:00-18:59:59 and 22:00:00-23:59:59 it logged a generic end-of-task
# line and killed run_xngplus, run_zfqz, run_xngrule, run_jixiangxingfu and
# run_zmyx. Those ranges overlap windows that are active above, so it must
# not be re-enabled unchanged. Kill lines for run_htzf,
# run_ganggangdouchuan and run_zhongmiaoyinxin were likewise disabled in
# every section and are not reproduced.

# Remove old log files.
log_msg "开始清理 10 天前的日志文件"
find "${piaoquan_crawler_dir}main/main_logs/" -mtime +10 -name "*.log" -exec rm -rf {} \;
log_msg "日志文件清理完毕"
exit 0