# model_predict_analyse.py
  1. import argparse
  2. import sys
  3. import gzip
  4. from hdfs import InsecureClient
  5. client = InsecureClient("http://master-1-1.c-7f31a3eea195cb73.cn-hangzhou.emr.aliyuncs.com:9870", user="spark")
  6. def read_predict(hdfs_path):
  7. dir = "/dw/recommend/model/34_ad_predict_data/20241004_351_0927_1003_1000/"
  8. for file in client.list(dir):
  9. with client.read(dir + file, encoding="utf-8") as reador:
  10. with gzip.GzipFile(fileobj=reador, mode="rb") as gz_file:
  11. content = gz_file.read().decode("utf-8")
  12. print(f"Content of {file}:\n {content}")
  13. def _main():
  14. read_predict("")
  15. if __name__ == '__main__':
  16. # parser = argparse.ArgumentParser(description="model_predict_analyse.py")
  17. # parser.add_argument("-p", "--predict_path_list", type=list, help="config file path")
  18. # args = parser.parse_args()
  19. #
  20. # predict_path_list = args.predict_path_list
  21. # # 判断参数是否正常
  22. # if len(predict_path_list) != 2:
  23. # sys.exit(1)
  24. _main()