Browse Source

fix data format

often 5 months ago
parent
commit
976542ed7e

+ 1 - 1
recommend-model-produce/src/main/python/models/dssm/bq_reader_train_ps.py

@@ -12,7 +12,7 @@ class DSSMReader(MultiSlotDataGenerator):
     def line_process(self, line):
         try:
             # 按tab分割样本的各个字段
-            sample_id, label, left_features, right_features = line.rstrip('\n').split('\t')
+            sample_id, label, left_features, right_features = line.rstrip('\n').split('    ')
             
             # 转换label为整数
             label = int(label)