process.sh 16 KB


  1. #! /bin/bash
  2. env=$1 # 环境
  3. if [ ${env} = "dev" ];then
  4. piaoquan_crawler_dir=/Users/wangkun/Desktop/crawler/piaoquan_crawler/
  5. profile_path=/etc/profile
  6. python=python3
  7. log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
  8. elif [ ${env} = "hk" ];then
  9. piaoquan_crawler_dir=/root/piaoquan_crawler/
  10. profile_path=/etc/profile
  11. python=python3
  12. log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
  13. else
  14. piaoquan_crawler_dir=/data5/piaoquan_crawler/
  15. profile_path=/etc/profile
  16. python=python
  17. log_path=${piaoquan_crawler_dir}main/main_logs/process-$(date +%Y-%m-%d).log
  18. fi
  19. time=$(date +%H:%M:%S)
  20. echo "$(date "+%Y-%m-%d %H:%M:%S") 开始监测爬虫进程状态" >> ${log_path}
  21. echo "$(date "+%Y-%m-%d %H:%M:%S") 更新环境变量..." >> ${log_path}
  22. cd ~ && source /etc/profile
  23. echo "$(date "+%Y-%m-%d %H:%M:%S") 更新环境变量完成!" >> ${log_path}
  # Watchdog for the Gongzhonghao (WeChat official account) crawler, accounts 1-100.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_gongzhonghao_follow.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_gongzhonghao_follow() {
    local script="./gongzhonghao/gongzhonghao_main/run_gongzhonghao_follow.py"
    local nohup_log="gongzhonghao/logs/nohup-follow.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 公众号爬虫策略 1-100个账号 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself,
    # so no "grep -v grep" filter is needed.
    if pgrep -f "run_gongzhonghao_follow.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 公众号爬虫策略1-100个账号 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="gongzhonghao" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="author" --crawler="gongzhonghao" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_gongzhonghao_follow
  # Watchdog for the Gongzhonghao (WeChat official account) crawler, accounts 101-145.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_gongzhonghao_follow_2.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_gongzhonghao_follow_2() {
    local script="./gongzhonghao/gongzhonghao_main/run_gongzhonghao_follow_2.py"
    local nohup_log="gongzhonghao/logs/nohup-follow-2.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 公众号爬虫策略101-145个账号 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_gongzhonghao_follow_2.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 公众号爬虫策略101-145个账号 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="follow-2" --crawler="gongzhonghao" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="follow-2" --crawler="gongzhonghao" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_gongzhonghao_follow_2
  # Watchdog for the Xiaoniangao follow (targeted-account) crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_xiaoniangao_follow.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_xiaoniangao_follow() {
    local script="./xiaoniangao/xiaoniangao_main/run_xiaoniangao_follow.py"
    local nohup_log="xiaoniangao/logs/nohup-follow.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 小年糕定向爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xiaoniangao_follow.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 小年糕定向爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="xiaoniangao" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="author" --crawler="xiaoniangao" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xiaoniangao_follow
  # Watchdog for the Xiaoniangao hourly-ranking crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_xiaoniangao_hour.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_xiaoniangao_hour() {
    local script="./xiaoniangao/xiaoniangao_main/run_xiaoniangao_hour.py"
    local nohup_log="xiaoniangao/logs/nohup-hour.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 小年糕小时榜爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xiaoniangao_hour.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 小年糕小时榜爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="hour" --crawler="xiaoniangao" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="hour" --crawler="xiaoniangao" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xiaoniangao_hour
  # Watchdog for the Xiaoniangao play-count-ranking crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_xiaoniangao_play.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_xiaoniangao_play() {
    local script="./xiaoniangao/xiaoniangao_main/run_xiaoniangao_play.py"
    local nohup_log="xiaoniangao/logs/nohup-play.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 播放量榜爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xiaoniangao_play.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 播放量榜爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="play" --crawler="xiaoniangao" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="play" --crawler="xiaoniangao" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xiaoniangao_play
  # Watchdog for the Kuaishou follow (targeted-account) crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_kuaishou_follow.py, the crawler is
  # relaunched: dev goes through main/scheduling_main.sh, every other
  # environment through ./main/main.sh with the prod/aliyun arguments.
  monitor_kuaishou_follow() {
    local script="./kuaishou/kuaishou_main/run_kuaishou_follow.py"
    local nohup_log="kuaishou/logs/nohup-follow.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 快手定向爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_kuaishou_follow.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 快手定向爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="kuaishou" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh ./main/main.sh "${script}" --log_type="author" --crawler="kuaishou" --strategy="定向爬虫策略" --oss_endpoint="inner" --env="prod" --machine="aliyun" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_kuaishou_follow
  ## Kuaishou recommend crawler watchdog (disabled)
  ## NOTE(review): the dev command below launches run_kuaishou_follow.py with --log_type="author",
  ## not run_kuaishou_recommend.py; correct it before re-enabling this section.
  #echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 快手推荐爬虫策略 进程状态" >> ${log_path}
  #ps -ef | grep "run_kuaishou_recommend.py" | grep -v "grep"
  #if [ "$?" -eq 1 ];then
  # echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> ${log_path}
  # if [ ${env} = "dev" ];then
  # cd ${piaoquan_crawler_dir} && sh main/scheduling_main.sh ./kuaishou/kuaishou_main/run_kuaishou_follow.py --log_type="author" --crawler="kuaishou" --env="dev" kuaishou/logs/nohup-recommend.log
  # else
  # cd ${piaoquan_crawler_dir} && /usr/bin/sh ./main/main.sh ./kuaishou/kuaishou_main/run_kuaishou_recommend.py --log_type="recommend" --crawler="kuaishou" --strategy="推荐爬虫策略" --oss_endpoint="inner" --env="prod" --machine="aliyun" kuaishou/logs/nohup-recommend.log
  # fi
  # echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> ${log_path}
  #else
  # echo "$(date "+%Y-%m-%d %H:%M:%S") 快手推荐爬虫策略 进程状态正常" >> ${log_path}
  #fi
  # Watchdog for the Douyin recommend crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_douyin_recommend.py, the crawler is
  # relaunched: dev goes through main/scheduling_main.sh, every other
  # environment through ./main/main.sh with the prod/aliyun arguments.
  monitor_douyin_recommend() {
    local script="./douyin/douyin_main/run_douyin_recommend.py"
    local nohup_log="douyin/logs/nohup-recommend.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 抖音推荐爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_douyin_recommend.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 抖音推荐爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      # Fixed: the dev branch used to start run_kuaishou_follow.py (copy-paste),
      # so the process being monitored here was never brought back up in dev.
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="recommend" --crawler="douyin" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh ./main/main.sh "${script}" --log_type="recommend" --crawler="douyin" --strategy="抖音推荐爬虫策略" --oss_endpoint="inner" --env="prod" --machine="aliyun" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_douyin_recommend
  # Watchdog for the Douyin follow (targeted-account) crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_douyin_follow.py, the crawler is
  # relaunched: dev goes through main/scheduling_main.sh, every other
  # environment through ./main/main.sh with the prod/aliyun arguments.
  monitor_douyin_follow() {
    local script="./douyin/douyin_main/run_douyin_follow.py"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 抖音定向爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_douyin_follow.py" > /dev/null; then
      # Fixed: this line used to name the recommend strategy, mislabelling the log.
      echo "$(date "+%Y-%m-%d %H:%M:%S") 抖音定向爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      # Fixed: the dev path pointed at ./kuaishou/douyin_main/, whereas the
      # non-dev branch launches the script from ./douyin/douyin_main/.
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="douyin" --env="dev" douyin/logs/nohup-follow.log
    else
      # NOTE(review): non-dev writes to nohup-author.log while dev uses
      # nohup-follow.log; kept as in the original - confirm which is intended.
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh ./main/main.sh "${script}" --log_type="author" --crawler="douyin" --strategy="抖音定向爬虫策略" --oss_endpoint="inner" --env="prod" --machine="aliyun" douyin/logs/nohup-author.log
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_douyin_follow
  # Watchdog for the Xigua follow (targeted-account) crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_xigua_follow.py, the crawler is
  # relaunched: dev goes through main/scheduling_main.sh, every other
  # environment through ./main/main.sh with the prod/aliyun arguments.
  monitor_xigua_follow() {
    local script="./xigua/xigua_main/run_xigua_follow.py"
    local nohup_log="xigua/logs/nohup-follow.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 西瓜定向爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xigua_follow.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 西瓜定向爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="xigua" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh ./main/main.sh "${script}" --log_type="author" --crawler="xigua" --strategy="定向爬虫策略" --oss_endpoint="inner" --env="prod" --machine="aliyun" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xigua_follow
  # Watchdog for the Xigua recommend-feed crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_xigua_recommend.py, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_xigua_recommend() {
    local script="./xigua/xigua_main/run_xigua_recommend.py"
    local nohup_log="xigua/logs/nohup-recommend.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 西瓜推荐榜爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xigua_recommend.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 西瓜推荐榜爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="recommend" --crawler="xigua" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh main/scheduling_main.sh "${script}" --log_type="recommend" --crawler="xigua" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xigua_recommend
  # Watchdog for the Xigua search crawler.
  # Globals read: time, env, piaoquan_crawler_dir, log_path.
  # Only acts when ${time} (HH:MM:SS) falls in the window 00:00:00 <= time < 00:10:00;
  # outside that window it just logs that the task is out of its start range.
  monitor_xigua_search() {
    # String comparison is sufficient because time is zero-padded HH:MM:SS.
    # Midnight itself is now inside the window: the original strict
    # '> "00:00:00"' skipped a run stamped exactly 00:00:00.
    # An empty time is treated as outside the window.
    if [[ -z "${time}" || ! "${time}" < "00:10:00" ]]; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 不在任务启动时间范围: 西瓜搜索爬虫" >> "${log_path}"
      return 0
    fi

    local script="./xigua/xigua_main/run_xigua_search_new.py"
    local nohup_log="xigua/logs/nohup-search.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 西瓜搜索爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_xigua_search_new" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 西瓜搜索爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d %H:%M:%S") 西瓜搜索爬虫策略, 异常停止, 正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="search" --crawler="xigua" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh main/scheduling_main.sh "${script}" --log_type="search" --crawler="xigua" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_xigua_search
  # Watchdog for the YouTube follow (targeted-account) crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_youtube_follow.py, the crawler is
  # relaunched: dev goes through main/scheduling_main.sh, every other
  # environment through ./main/main.sh with the hk/aliyun_hk arguments.
  monitor_youtube_follow() {
    local script="./youtube/youtube_main/run_youtube_follow.py"
    local nohup_log="youtube/logs/nohup-follow.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 youtube定向爬虫策略 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_youtube_follow.py" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") youtube定向爬虫策略 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="author" --crawler="youtube" --env="dev" "${nohup_log}"
    else
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh ./main/main.sh "${script}" --log_type="author" --crawler="youtube" --strategy="定向爬虫策略" --oss_endpoint="hk" --env="hk" --machine="aliyun_hk" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_youtube_follow
  209. ## 本山祝福小程序爬虫
  210. #echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 本山祝福小程序爬虫 进程状态" >> ${log_path}
  211. #ps -ef | grep "run_benshanzhufu" | grep -v "grep"
  212. #if [ "$?" -eq 1 ];then
  213. # echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> ${log_path}
  214. # if [ ${env} = "dev" ];then
  215. # cd ${piaoquan_crawler_dir} && sh main/scheduling_main.sh ./benshanzhufu/benshanzhufu_main/run_benshanzhufu_recommend.py --log_type="recommend" --crawler="benshanzhufu" --env="dev" benshanzhufu/logs/nohup-recommend.log
  216. # else
  217. # cd ${piaoquan_crawler_dir} && /usr/bin/sh /data5/piaoquan_crawler/main/scheduling_main.sh ./benshanzhufu/benshanzhufu_main/run_benshanzhufu_recommend.py --log_type="recommend" --crawler="benshanzhufu" --env="prod" benshanzhufu/logs/nohup-recommend.log
  218. # fi
  219. # echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> ${log_path}
  220. #else
  221. # echo "$(date "+%Y-%m-%d %H:%M:%S") 本山祝福小程序爬虫 进程状态正常" >> ${log_path}
  222. #fi
  223. ## 岁岁年年迎福气小程序爬虫
  224. #echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 岁岁年年迎福气小程序爬虫 进程状态" >> ${log_path}
  225. #ps -ef | grep "run_suisuiniannianyingfuqi" | grep -v "grep"
  226. #if [ "$?" -eq 1 ];then
  227. # echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> ${log_path}
  228. # if [ ${env} = "dev" ];then
  229. # cd ${piaoquan_crawler_dir} && sh main/scheduling_main.sh ./suisuiniannianyingfuqi/suisuiniannianyingfuqi_main/run_suisuiniannianyingfuqi_recommend.py --log_type="recommend" --crawler="suisuiniannianyingfuqi" --env="dev" suisuiniannianyingfuqi/logs/nohup-recommend.log
  230. # else
  231. # cd ${piaoquan_crawler_dir} && /usr/bin/sh /data5/piaoquan_crawler/main/scheduling_main.sh ./suisuiniannianyingfuqi/suisuiniannianyingfuqi_main/run_suisuiniannianyingfuqi_recommend.py --log_type="recommend" --crawler="suisuiniannianyingfuqi" --env="prod" suisuiniannianyingfuqi/logs/nohup-recommend.log
  232. # fi
  233. # echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> ${log_path}
  234. #else
  235. # echo "$(date "+%Y-%m-%d %H:%M:%S") 岁岁年年迎福气小程序爬虫 进程状态正常" >> ${log_path}
  236. #fi
  # Watchdog for the Weixin-index (weixinzhishu) bot crawler.
  # Globals read: env, piaoquan_crawler_dir, log_path.
  # When no running process matches run_weixinzhishu_bot, the crawler is
  # relaunched through main/scheduling_main.sh; each step is appended to log_path.
  monitor_weixinzhishu_bot() {
    local script="./weixinzhishu/weixinzhishu_main/run_weixinzhishu_bot.py"
    local nohup_log="weixinzhishu/logs/nohup-bot.log"

    echo "$(date "+%Y-%m-%d %H:%M:%S") 正在监测 微信指数 bot 爬虫 进程状态" >> "${log_path}"
    # pgrep -f matches against the full command line and never reports itself.
    if pgrep -f "run_weixinzhishu_bot" > /dev/null; then
      echo "$(date "+%Y-%m-%d %H:%M:%S") 微信指数 bot 爬虫 进程状态正常" >> "${log_path}"
      return 0
    fi

    echo "$(date "+%Y-%m-%d_%H:%M:%S") 异常停止,正在重启!" >> "${log_path}"
    if [ "${env}" = "dev" ]; then
      cd "${piaoquan_crawler_dir}" && sh main/scheduling_main.sh "${script}" --log_type="bot" --crawler="weixinzhishu" --env="dev" "${nohup_log}"
    else
      # Launcher path comes from piaoquan_crawler_dir rather than a hard-coded
      # /data5 prefix, so it also resolves when the checkout lives elsewhere (hk).
      cd "${piaoquan_crawler_dir}" && /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" --log_type="bot" --crawler="weixinzhishu" --env="prod" "${nohup_log}"
    fi
    echo "$(date "+%Y-%m-%d %H:%M:%S") 重启完成!" >> "${log_path}"
  }
  monitor_weixinzhishu_bot
  # Log retention: remove *.log files under main/main_logs/ that find selects
  # with -mtime +5.
  # Globals read: piaoquan_crawler_dir, log_path.
  purge_old_logs() {
    echo "$(date "+%Y-%m-%d %H:%M:%S") 开始清理 5 天前的日志文件" >> "${log_path}"
    # -type f with rm -f limits deletion to regular files; the previous
    # "rm -rf" would also have removed a whole directory named *.log.
    # "--" stops rm from treating a file name as an option, and "+" batches
    # the matches into as few rm invocations as possible.
    find "${piaoquan_crawler_dir}main/main_logs/" -type f -mtime +5 -name "*.log" -exec rm -f -- {} +
    echo "$(date "+%Y-%m-%d %H:%M:%S") 日志文件清理完毕" >> "${log_path}"
  }
  purge_old_logs
  # Report success unconditionally, whatever the status of the preceding commands.
  exit 0