often 提交于 6 个月前
父节点
当前提交
0ab1518074
共有 1 个文件被更改,包括 2 次插入和 5 次删除
  1. 2 5
      recommend-model-produce/src/main/python/models/dssm/bq_reader_train_ps.py

+ 2 - 5
recommend-model-produce/src/main/python/models/dssm/bq_reader_train_ps.py

@@ -14,7 +14,7 @@ class DSSMReader(MultiSlotDataGenerator):
         try:
             # 按tab分割样本的各个字段
             sample_values = line.rstrip('\n').split('\t')
-            sys.stderr.write(f"sample_values length: {len(sample_values)}\n")
+            
             if len(sample_values) == 6: # 训练格式
                 sample_id, label, vid_left,vid_right,left_features, right_features = sample_values
                 # 转换label为整数
@@ -24,10 +24,7 @@ class DSSMReader(MultiSlotDataGenerator):
                 left_features = [float(x) for x in left_features.split(',')]
                 right_features = [float(x) for x in right_features.split(',')]
                 
-                # 验证特征维度
-                if len(left_features) != self.feature_dim or len(right_features) != self.feature_dim:
-                    return None
-                
+                sys.stderr.write(f"left_features length: {len(left_features)}\n")
                 # 构建输出列表
                 output = []
                 #output.append(("sample_id", [sample_id]))  # 样本ID