| 
					
				 | 
			
			
				@@ -3,7 +3,6 @@ import gzip 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 import sys 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 import pandas as pd 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 from hdfs import InsecureClient 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 client = InsecureClient("http://master-1-1.c-7f31a3eea195cb73.cn-hangzhou.emr.aliyuncs.com:9870", user="spark") 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -32,6 +31,15 @@ def read_predict(hdfs_path: str) -> list: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 def _main(model1_predict_path: str, model2_predict_path: str): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    if not model1_predict_path.endswith("/"): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        model1_predict_path += "/" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    if not model2_predict_path.endswith("/"): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        model2_predict_path += "/" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    # # Configure pandas display options 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    # pd.set_option('display.max_rows', None)  # show all rows 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+    # pd.set_option('display.max_columns', None)  # show all columns 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     model1_result = read_predict(model1_predict_path) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     model2_result = read_predict(model2_predict_path) 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -55,8 +63,6 @@ def _main(model1_predict_path: str, model2_predict_path: str): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     # Compute the mean of the differences, rounded to six decimal places 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     mean_abs_diff = round(merged['score_diff'].mean(), 6) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-    print(mean_abs_diff) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-     
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 if __name__ == '__main__': 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     parser = argparse.ArgumentParser(description="model_predict_analyse.py") 
			 |