public.py 921 B

123456789101112131415161718192021222324252627282930313233
  1. # -*- coding: utf-8 -*-
  2. # @Author: wangkun
  3. # @Time: 2023/3/27
  4. from common.scheduling_db import MysqlHelper
  5. # from scheduling_db import MysqlHelper
  6. # 过滤词库
  7. def filter_word(log_type, crawler, source, env):
  8. """
  9. 过滤词库
  10. :param log_type: 日志
  11. :param crawler: 哪款爬虫,如:xiaoniangao
  12. :param source: 哪款爬虫,如:小年糕
  13. :param env: 环境
  14. :return: word_list
  15. """
  16. select_sql = f""" select * from crawler_filter_word where source="{source}" """
  17. words = MysqlHelper.get_values(log_type, crawler, select_sql, env, action='')
  18. if len(words) == 0:
  19. return None
  20. word_list = []
  21. for word in words:
  22. # ss = word['filter_word']
  23. # print(type(ss))
  24. # print(ss)
  25. word_list.append(word['filter_word'])
  26. return word_list
  27. if __name__ == "__main__":
  28. print(filter_word('public', 'xiaoniangao', '小年糕', 'prod'))