|  | @@ -33,6 +33,7 @@ object makedata_ad_33_bucketData_20240729 {
 | 
											
												
													
														|  |      val repartition = param.getOrElse("repartition", "100").toInt
 |  |      val repartition = param.getOrElse("repartition", "100").toInt
 | 
											
												
													
														|  |      val filterNames = param.getOrElse("filterNames", "").split(",").toSet
 |  |      val filterNames = param.getOrElse("filterNames", "").split(",").toSet
 | 
											
												
													
														|  |      val whatLabel = param.getOrElse("whatLabel", "ad_is_conversion")
 |  |      val whatLabel = param.getOrElse("whatLabel", "ad_is_conversion")
 | 
											
												
													
														|  | 
 |  | +    val cidCountThreshold = param.getOrElse("cidCountThreshold", "20000").toInt
 | 
											
												
													
														|  |  
 |  |  
 | 
											
												
													
														|  |      val loader = getClass.getClassLoader
 |  |      val loader = getClass.getClassLoader
 | 
											
												
													
														|  |  
 |  |  
 | 
											
										
											
												
													
														|  | @@ -86,7 +87,7 @@ object makedata_ad_33_bucketData_20240729 {
 | 
											
												
													
														|  |              }
 |  |              }
 | 
											
												
													
														|  |              val count = cidCountMap.getOrElse(key, 0) + 1
 |  |              val count = cidCountMap.getOrElse(key, 0) + 1
 | 
											
												
													
														|  |              cidCountMap.put(key, count)
 |  |              cidCountMap.put(key, count)
 | 
											
												
													
														|  | -            count > 20000
 |  | 
 | 
											
												
													
														|  | 
 |  | +            count < cidCountThreshold
 | 
											
												
													
														|  |          }.map{
 |  |          }.map{
 | 
											
												
													
														|  |            case (logKey, labelKey, features) =>
 |  |            case (logKey, labelKey, features) =>
 | 
											
												
													
														|  |              val label = JSON.parseObject(labelKey).getOrDefault(whatLabel, "0").toString
 |  |              val label = JSON.parseObject(labelKey).getOrDefault(whatLabel, "0").toString
 |