#!/bin/bash
# process_offline.sh
# ********** Offline crawlers ********** #
#
# Usage: process_offline.sh <env>
#   env - crawler runtime environment. "dev" selects the test-machine
#         settings; any other value (normally "prod"), including a missing
#         argument, selects the production settings.
#
# This section only resolves per-environment paths:
#   piaoquan_crawler_dir - crawler project root (with trailing slash)
#   profile_path         - shell profile that is sourced later
#   node_path            - node binary used to start Appium
#   log_path             - per-day log file of this script
env=${1:-}
#echo ${env}

# Quoted [[ ]] comparison: a missing argument falls through to the production
# branch instead of raising "unary operator expected" from an unquoted [ ].
if [[ "${env}" == "dev" ]]; then
  piaoquan_crawler_dir=/Users/wangkun/Desktop/crawler/piaoquan_crawler/
  profile_path=/etc/profile
  node_path=/opt/homebrew/bin/node
else
  piaoquan_crawler_dir=/Users/piaoquan/Desktop/piaoquan_crawler/
  profile_path=./base_profile
  node_path=/usr/local/bin/node
fi

# The log location is built the same way in both environments.
log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
  # Capture the current wall-clock time (HH:MM:SS) once; the crawler
  # time-window checks later in the script compare against this value.
  time=$(date +%H:%M:%S)

  # Reload the shell profile from the home directory, logging before and after.
  # profile_path may be relative (./base_profile), hence the cd to ~ first.
  printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "更新环境变量..." >> "${log_path}"
  cd ~ && source "${profile_path}"
  printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "更新环境变量完成!" >> "${log_path}"
  # Appium watchdog: look for a process whose command line contains the Appium
  # entry script and start one with nohup if none is found.
  appium_main="/Applications/Appium.app/Contents/Resources/app/node_modules/appium/build/lib/main.js"
  printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "正在重启Appium..." >> "${log_path}"

  # The matching ps lines (if any) are printed to stdout; the pipeline status
  # is 1 only when the final grep selected nothing, i.e. Appium is not running.
  ps -ef | grep "${appium_main}" | grep -v "grep"
  appium_probe=$?

  case "${appium_probe}" in
    1)
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "Appium异常停止,正在重启!" >> "${log_path}"
      # Output goes to nohup.log in the current directory.
      nohup "${node_path}" "${appium_main}" >>./nohup.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启Appium完毕!" >> "${log_path}"
      ;;
    *)
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "Appium 进程状态正常" >> "${log_path}"
      ;;
  esac
  # Jixiangxingfu (吉祥幸福) crawler.
  # Runs when $time is strictly between 00:00:59 and 01:59:59, or strictly
  # between 05:00:00 and 05:59:59 (lexicographic HH:MM:SS comparison).
  if [[ ( "$time" > "00:00:59" && "$time" < "01:59:59" ) || ( "$time" > "05:00:00" && "$time" < "05:59:59" ) ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 吉祥幸福 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_zhongmiaoyinxin used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_ppqsift run_zfqz run_zmyx run_xngplus run_xngrule; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_jixiangxingfu_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "吉祥幸福爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u jixiangxingfu/jixiangxingfu_main/run_jixiangxingfu_recommend.py \
        --log_type="recommend" --crawler="jixiangxingfu" --env="${env}" \
        >>jixiangxingfu/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "吉祥幸福 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "吉祥幸福 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Zhongmiaoyinxin-new (众妙音信-new) crawler.
  # Runs when $time is strictly between 02:00:00 and 03:59:59, or strictly
  # between 06:00:00 and 06:59:59 (lexicographic HH:MM:SS comparison).
  if [[ ( "$time" > "02:00:00" && "$time" < "03:59:59" ) || ( "$time" > "06:00:00" && "$time" < "06:59:59" ) ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 众妙音信-new 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_jixiangxingfu run_zfqz run_xngplus run_xngrule; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_zmyx_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "众妙音信-new小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u zhongmiaoyinxin/zhongmiaoyinxin_main/run_zmyx_recommend.py \
        --log_type="recommend" --crawler="zhongmiaoyinxin" --env="${env}" \
        >>zhongmiaoyinxin/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "众妙音信-new小程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "众妙音信 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Xiaoniangao-rule (小年糕-rule) crawler.
  # Runs when $time is strictly between 21:00:00 and 21:59:59
  # (lexicographic HH:MM:SS comparison).
  if [[ "$time" > "21:00:00" && "$time" < "21:59:59" ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 小年糕-rule 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_zmyx run_xngplus; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_xngrule_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕-rule 小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u xiaoniangaoplus/xiaoniangaoplus_main/run_xngrule_recommend.py \
        --log_type="recommend" --crawler="xiaoniangaoplus" --env="${env}" \
        >>xiaoniangaoplus/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕-rule 程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕-rule 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Xiaoniangao-plus (小年糕+) crawler.
  # Runs when $time falls strictly inside any of four windows:
  # 10:00:00-11:59:59, 19:00:00-20:59:59, 13:00:00-14:59:59, 17:00:00-17:59:59
  # (lexicographic HH:MM:SS comparison).
  if [[ ( "$time" > "10:00:00" && "$time" < "11:59:59" ) \
     || ( "$time" > "19:00:00" && "$time" < "20:59:59" ) \
     || ( "$time" > "13:00:00" && "$time" < "14:59:59" ) \
     || ( "$time" > "17:00:00" && "$time" < "17:59:59" ) ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 小年糕+ 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_xngrule run_zfqz run_zmyx run_jixiangxingfu run_ppq; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_xngplus_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕+ 小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      # Note: this crawler is launched with python3.10 specifically.
      nohup python3.10 -u xiaoniangaoplus/xiaoniangaoplus_main/run_xngplus_recommend.py \
        --log_type="recommend" --crawler="xiaoniangaoplus" --env="${env}" \
        >>xiaoniangaoplus/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕+ 程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "小年糕+ 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Zhufuquanzi (祝福圈子) crawler.
  # Runs when $time is strictly between 07:00:00 and 08:59:59, or strictly
  # between 15:00:00 and 15:59:59 (lexicographic HH:MM:SS comparison).
  if [[ ( "$time" > "07:00:00" && "$time" < "08:59:59" ) || ( "$time" > "15:00:00" && "$time" < "15:59:59" ) ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 祝福圈子 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_xngplus run_xngrule run_jixiangxingfu run_zmyx; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_zfqz_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "祝福圈子 小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u zhufuquanzi/zhufuquanzi_main/run_zfqz_recommend.py \
        --log_type="recommend" --crawler="zhufuquanzi" --env="${env}" \
        >>zhufuquanzi/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "祝福圈子 程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "祝福圈子 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Piaopiaoquan (漂漂圈) crawler.
  # Runs when $time is strictly between 16:00:00 and 16:59:59
  # (lexicographic HH:MM:SS comparison).
  #
  # Fix: this section previously had no closing else/fi for the window check,
  # so the section that follows it was parsed as part of this branch and the
  # script ended with an unterminated `if`. The block is now closed the same
  # way as every other crawler section.
  if [[ "$time" > "16:00:00" && "$time" < "16:59:59" ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 漂漂圈 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    for stale_pattern in run_xngplus run_xngrule run_jixiangxingfu run_zmyx run_zfqz; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_ppq_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈 小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u piaopiaoquan/piaopiaoquan_main/run_ppq_recommend.py \
        --log_type="recommend" --crawler="piaopiaoquan" --env="${env}" \
        >>piaopiaoquan/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈 程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Piaopiaoquan-selected (漂漂圈-精选) crawler.
  # Runs when $time is strictly between 22:00:00 and 23:59:59
  # (lexicographic HH:MM:SS comparison).
  if [[ "$time" > "22:00:00" && "$time" < "23:59:59" ]]; then
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "开始启动 漂漂圈精选 爬虫脚本任务" >> "${log_path}"

    # Kill every process whose ps line matches one of the other crawlers'
    # script prefixes. (run_htzf and run_ganggangdouchuan used to be in this
    # list and are intentionally disabled.)
    #
    # Fix: the last pattern used to be "run_ppq", which is also a prefix of
    # this section's own script (run_ppqsift_recommend.py). The crawler was
    # therefore killed here and then always found "stopped" and restarted
    # below. "run_ppq_recommend" targets only the plain 漂漂圈 crawler.
    for stale_pattern in run_xngplus run_xngrule run_jixiangxingfu run_zmyx run_zfqz run_ppq_recommend; do
      ps aux | grep "${stale_pattern}" | grep -v grep | awk '{print $2}' | xargs kill -9
    done

    # Status 1 from the pipeline means no matching process line was found.
    ps -ef | grep "run_ppqsift_recommend.py" | grep -v "grep"
    crawler_probe=$?
    if [[ "${crawler_probe}" -eq 1 ]]; then
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈精选 小程序爬虫, 异常停止, 正在重启!" >> "${log_path}"
      adb forward --remove-all
      # The script path and its nohup log are relative to the project root.
      cd "${piaoquan_crawler_dir}"
      nohup python3 -u piaopiaoquan/piaopiaoquan_main/run_ppqsift_recommend.py \
        --log_type="recommend" --crawler="piaopiaoquan" --env="${env}" \
        >>piaopiaoquan/logs/nohup-recommend.log 2>&1 &
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "重启完成!" >> "${log_path}"
    else
      printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈精选 程序爬虫, 进程状态正常" >> "${log_path}"
    fi
  else
    printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "漂漂圈精选 爬虫脚本任务结束" >> "${log_path}"
  fi
  # Disabled (kept for reference): time-window block that logged the end of
  # the crawler tasks and killed the listed crawlers.
  #if [[ "$time" > "13:00:00" && "$time" < "13:59:59" || "$time" > "16:00:00" && "$time" < "18:59:59" || "$time" > "22:00:00" && "$time" < "23:59:59" ]];then
  # echo "$(date "+%Y-%m-%d %H:%M:%S") 爬虫脚本任务结束" >> ${log_path}
  ## ps aux | grep run_htzf | grep -v grep | awk '{print $2}' | xargs kill -9
  ## ps aux | grep run_ganggangdouchuan | grep -v grep | awk '{print $2}' | xargs kill -9
  # ps aux | grep run_xngplus | grep -v grep | awk '{print $2}' | xargs kill -9
  # ps aux | grep run_zfqz | grep -v grep | awk '{print $2}' | xargs kill -9
  # ps aux | grep run_xngrule | grep -v grep | awk '{print $2}' | xargs kill -9
  # ps aux | grep run_jixiangxingfu | grep -v grep | awk '{print $2}' | xargs kill -9
  # ps aux | grep run_zmyx | grep -v grep | awk '{print $2}' | xargs kill -9
  #fi
  # Log cleanup: remove *.log files under main/main_logs/ that were last
  # modified more than 10 days ago, then finish with a success status.
  echo "$(date "+%Y-%m-%d %H:%M:%S") 开始清理 10 天前的日志文件" >> "${log_path}"
  # -type f restricts the match to regular files, so a directory that happens
  # to be named *.log is never removed recursively; "{} +" hands the matches to
  # rm in batches instead of forking one rm per file.
  find "${piaoquan_crawler_dir}main/main_logs/" -type f -mtime +10 -name "*.log" -exec rm -f -- {} +
  echo "$(date "+%Y-%m-%d %H:%M:%S") 日志文件清理完毕" >> "${log_path}"
  exit 0