#!/bin/bash
#
# process.sh - watchdog for the piaoquan crawler processes.
#
# Usage: process.sh <env>
#   <env>  "dev", "hk", or anything else (treated as production).
#
# For each monitored crawler the script looks for a running process whose
# command line matches the crawler's entry script. When none is found, the
# crawler is relaunched through main/scheduling_main.sh or main/main.sh.
# Progress is appended to main/main_logs/process-<date>.log, and *.log files
# in that directory that are more than 5 days old are removed at the end.
#
# Strict mode (set -e / set -u) is intentionally not enabled: a failed restart
# of one crawler must not stop the remaining checks, and the sourced profile
# is outside this script's control.

env=${1:-} # deployment environment

# Root of the crawler checkout for the selected environment (trailing slash
# is part of the value; paths below are built by plain concatenation).
case "${env}" in
  dev) piaoquan_crawler_dir=/Users/wangkun/Desktop/crawler/piaoquan_crawler/ ;;
  hk) piaoquan_crawler_dir=/root/piaoquan_crawler/ ;;
  *) piaoquan_crawler_dir=/data5/piaoquan_crawler/ ;;
esac
profile_path=/etc/profile
log_dir="${piaoquan_crawler_dir}main/main_logs/"
log_path="${log_dir}process-$(date +%Y-%m-%d).log"
# Captured once at startup; used for the time-gated Xigua search check.
start_time=$(date +%H:%M:%S)

#######################################
# Append one timestamped line to the watchdog log.
# Globals:   log_path (read)
# Arguments: $* - message text
#######################################
log() {
  printf '%s %s\n' "$(date "+%Y-%m-%d %H:%M:%S")" "$*" >> "${log_path}"
}

#######################################
# Tell whether no process matches a command-line pattern.
# Arguments: $1 - pattern matched against full command lines (pgrep -f)
# Returns:   0 when no matching process exists, 1 otherwise
#######################################
crawler_is_down() {
  local pattern=$1
  local status=0
  pgrep -f -- "${pattern}" > /dev/null || status=$?
  case "${status}" in
    0) return 1 ;;
    1) return 0 ;;
    *)
      # Only "no match" (status 1) counts as down. If pgrep itself failed we
      # cannot tell, so report it and do not trigger a restart that might
      # start a duplicate crawler.
      printf 'process.sh: pgrep exited with status %s for pattern %s\n' \
        "${status}" "${pattern}" >&2
      return 1
      ;;
  esac
}

#######################################
# Launch a crawler through main/scheduling_main.sh.
# Globals:   env, piaoquan_crawler_dir (read); changes the working directory
# Arguments: $1 - crawler entry script, relative to the checkout root
#            $2 - value for --log_type
#            $3 - value for --crawler
#            $4 - nohup log path, relative to the checkout root
# Returns:   status of the launcher, or of cd when it fails
#######################################
launch_scheduled() {
  local script=$1 log_type=$2 crawler=$3 nohup_log=$4
  cd "${piaoquan_crawler_dir}" || return
  if [[ "${env}" == "dev" ]]; then
    sh main/scheduling_main.sh "${script}" \
      --log_type="${log_type}" --crawler="${crawler}" --env="dev" \
      "${nohup_log}"
  else
    # The launcher path is derived from the checkout root instead of a
    # hard-coded /data5 prefix, so it also resolves for the "hk" checkout.
    /usr/bin/sh "${piaoquan_crawler_dir}main/scheduling_main.sh" "${script}" \
      --log_type="${log_type}" --crawler="${crawler}" --env="prod" \
      "${nohup_log}"
  fi
}

#######################################
# Launch a crawler through main/main.sh; in "dev" the crawler is started
# through main/scheduling_main.sh instead.
# Globals:   env, piaoquan_crawler_dir (read); changes the working directory
# Arguments: $1 - crawler entry script, relative to the checkout root
#            $2 - value for --log_type
#            $3 - value for --crawler
#            $4 - nohup log path used in "dev"
#            $5 - value for --strategy
#            $6 - value for --oss_endpoint
#            $7 - value for --env
#            $8 - value for --machine
#            $9 - nohup log path used outside "dev"
# Returns:   status of the launcher, or of cd when it fails
#######################################
launch_main() {
  local script=$1 log_type=$2 crawler=$3 dev_nohup_log=$4
  local strategy=$5 oss_endpoint=$6 target_env=$7 machine=$8 nohup_log=$9
  if [[ "${env}" == "dev" ]]; then
    launch_scheduled "${script}" "${log_type}" "${crawler}" "${dev_nohup_log}"
    return
  fi
  cd "${piaoquan_crawler_dir}" || return
  /usr/bin/sh ./main/main.sh "${script}" \
    --log_type="${log_type}" --crawler="${crawler}" \
    --strategy="${strategy}" --oss_endpoint="${oss_endpoint}" \
    --env="${target_env}" --machine="${machine}" \
    "${nohup_log}"
}

#######################################
# Check one crawler and relaunch it when it is not running.
# Globals:   log_path (read)
# Arguments: $1   - display label used in the log messages
#            $2   - process pattern (see crawler_is_down)
#            $3.. - launcher function followed by its arguments
#######################################
ensure_running() {
  local label=$1 pattern=$2
  shift 2
  log "正在监测 ${label} 进程状态"
  if crawler_is_down "${pattern}"; then
    # This line has always been stamped with an underscore between date and
    # time; the format is kept so existing log consumers are unaffected.
    printf '%s 异常停止,正在重启!\n' "$(date "+%Y-%m-%d_%H:%M:%S")" \
      >> "${log_path}"
    "$@"
    # NOTE(review): completion is logged whatever the launcher returned, as
    # before; the launchers' exit-status contract is not visible from here.
    log "重启完成!"
  else
    log "${label} 进程状态正常"
  fi
}

log "开始监测爬虫进程状态"
log "更新环境变量..."
# shellcheck source=/dev/null
cd ~ && source "${profile_path}"
log "更新环境变量完成!"

# Disabled: official-account (gongzhonghao) crawlers.
# ensure_running "公众号爬虫策略 1-100个账号" "run_gongzhonghao_follow.py" \
#   launch_scheduled ./gongzhonghao/gongzhonghao_main/run_gongzhonghao_follow.py \
#   author gongzhonghao gongzhonghao/logs/nohup-follow.log
# ensure_running "公众号爬虫策略101-145个账号" "run_gongzhonghao_follow_2.py" \
#   launch_scheduled ./gongzhonghao/gongzhonghao_main/run_gongzhonghao_follow_2.py \
#   follow-2 gongzhonghao gongzhonghao/logs/nohup-follow-2.log

# Xiaoniangao: followed-author crawler
ensure_running "小年糕定向爬虫策略" "run_xiaoniangao_follow.py" \
  launch_scheduled ./xiaoniangao/xiaoniangao_main/run_xiaoniangao_follow.py \
  author xiaoniangao xiaoniangao/logs/nohup-follow.log

# Xiaoniangao: hourly-ranking crawler
ensure_running "小年糕小时榜爬虫策略" "run_xiaoniangao_hour.py" \
  launch_scheduled ./xiaoniangao/xiaoniangao_main/run_xiaoniangao_hour.py \
  hour xiaoniangao xiaoniangao/logs/nohup-hour.log

# Xiaoniangao: play-count-ranking crawler
ensure_running "播放量榜爬虫策略" "run_xiaoniangao_play.py" \
  launch_scheduled ./xiaoniangao/xiaoniangao_main/run_xiaoniangao_play.py \
  play xiaoniangao xiaoniangao/logs/nohup-play.log

# Disabled: Kuaishou followed-author and recommend crawlers.
# ensure_running "快手定向爬虫策略" "run_kuaishou_follow.py" \
#   launch_main ./kuaishou/kuaishou_main/run_kuaishou_follow.py \
#   author kuaishou kuaishou/logs/nohup-follow.log \
#   "定向爬虫策略" inner prod aliyun kuaishou/logs/nohup-follow.log
# ensure_running "快手推荐爬虫策略" "run_kuaishou_recommend.py" \
#   launch_main ./kuaishou/kuaishou_main/run_kuaishou_recommend.py \
#   recommend kuaishou kuaishou/logs/nohup-recommend.log \
#   "推荐爬虫策略" inner prod aliyun kuaishou/logs/nohup-recommend.log

# Douyin: recommend crawler
ensure_running "抖音推荐爬虫策略" "run_douyin_recommend.py" \
  launch_main ./douyin/douyin_main/run_douyin_recommend.py \
  recommend douyin douyin/logs/nohup-recommend.log \
  "抖音推荐爬虫策略" inner prod aliyun douyin/logs/nohup-recommend.log

# Douyin: followed-author crawler (the non-dev nohup log is nohup-author.log)
ensure_running "抖音定向爬虫策略" "run_douyin_follow.py" \
  launch_main ./douyin/douyin_main/run_douyin_follow.py \
  author douyin douyin/logs/nohup-follow.log \
  "抖音定向爬虫策略" inner prod aliyun douyin/logs/nohup-author.log

# Xigua: followed-author crawler
ensure_running "西瓜定向爬虫策略" "run_xigua_follow.py" \
  launch_main ./xigua/xigua_main/run_xigua_follow.py \
  author xigua xigua/logs/nohup-follow.log \
  "定向爬虫策略" inner prod aliyun xigua/logs/nohup-follow.log

# Xigua: recommend crawler
ensure_running "西瓜推荐榜爬虫策略" "run_xigua_recommend.py" \
  launch_scheduled ./xigua/xigua_main/run_xigua_recommend.py \
  recommend xigua xigua/logs/nohup-recommend.log

# Xigua: search crawler. Only checked when this run started in the first ten
# minutes of the day. The lower bound is inclusive so that a run stamped
# exactly 00:00:00 is not skipped. This stanza is written out by hand because
# its "stopped" log line differs from the one ensure_running emits.
if [[ "${start_time}" < "00:10:00" ]]; then
  log "正在监测 西瓜搜索爬虫策略 进程状态"
  if crawler_is_down "run_xigua_search_new"; then
    log "西瓜搜索爬虫策略, 异常停止, 正在重启!"
    launch_scheduled ./xigua/xigua_main/run_xigua_search_new.py \
      search xigua xigua/logs/nohup-search.log
    log "重启完成!"
  else
    log "西瓜搜索爬虫策略 进程状态正常"
  fi
else
  log "不在任务启动时间范围: 西瓜搜索爬虫"
fi

# YouTube: followed-author crawler (launched with the hk settings outside dev)
ensure_running "youtube定向爬虫策略" "run_youtube_follow.py" \
  launch_main ./youtube/youtube_main/run_youtube_follow.py \
  author youtube youtube/logs/nohup-follow.log \
  "定向爬虫策略" hk hk aliyun_hk youtube/logs/nohup-follow.log

# Disabled: Benshanzhufu and Suisuiniannianyingfuqi mini-program crawlers.
# ensure_running "本山祝福小程序爬虫" "run_benshanzhufu" \
#   launch_scheduled ./benshanzhufu/benshanzhufu_main/run_benshanzhufu_recommend.py \
#   recommend benshanzhufu benshanzhufu/logs/nohup-recommend.log
# ensure_running "岁岁年年迎福气小程序爬虫" "run_suisuiniannianyingfuqi" \
#   launch_scheduled ./suisuiniannianyingfuqi/suisuiniannianyingfuqi_main/run_suisuiniannianyingfuqi_recommend.py \
#   recommend suisuiniannianyingfuqi suisuiniannianyingfuqi/logs/nohup-recommend.log

# WeChat index bot
ensure_running "微信指数 bot 爬虫" "run_weixinzhishu_bot" \
  launch_scheduled ./weixinzhishu/weixinzhishu_main/run_weixinzhishu_bot.py \
  bot weixinzhishu weixinzhishu/logs/nohup-bot.log

# Remove watchdog logs last modified more than 5 days ago.
log "开始清理 5 天前的日志文件"
find "${log_dir}" -mtime +5 -name "*.log" -exec rm -rf -- {} +
log "日志文件清理完毕"
exit 0