public.py 845 B

123456789101112131415161718192021222324252627282930
  1. # -*- coding: utf-8 -*-
  2. # @Author: wangkun
  3. # @Time: 2023/3/27
  4. from common.scheduling_db import MysqlHelper
  5. # from scheduling_db import MysqlHelper
  6. # Filter-word lookup
  7. def filter_word(log_type, crawler, source, env):
  8. """
  9. 过滤词库
  10. :param log_type: 日志
  11. :param crawler: 哪款爬虫,如:xiaoniangao
  12. :param source: 哪款爬虫,如:小年糕
  13. :param env: 环境
  14. :return: word_list
  15. """
  16. select_sql = f""" select * from crawler_filter_word where source="{source}" """
  17. words = MysqlHelper.get_values(log_type, crawler, select_sql, env, action='')
  18. word_list = []
  19. if len(words) == 0:
  20. return word_list
  21. for word in words:
  22. word_list.append(word['filter_word'])
  23. return word_list
  24. if __name__ == "__main__":
  25. print(filter_word('public', 'xiaoniangao', '小年糕', 'prod'))