Browse Source

test 分布式

often 5 months ago
parent
commit
fbfe37c093

+ 1 - 1
recommend-model-produce/src/main/python/models/dssm/config_ps.yaml

@@ -21,7 +21,7 @@ runner:
   reader_type: "QueueDataset"  # DataLoader / QueueDataset / RecDataset
   pipe_command: "python bq_reader_train_ps.py"
   thread_num: 1
-  sync_mode: "sync"
+  sync_mode: "async"
 
   use_gpu: False
   epochs: 10

+ 1 - 1
recommend-model-produce/src/main/python/tools/static_ps_trainer.py

@@ -112,7 +112,7 @@ class Main(object):
 
     def init_fleet_with_gloo(use_gloo=True):
         if use_gloo:
-            os.environ["PADDLE_WITH_GLOO"] = 0
+            os.environ["PADDLE_WITH_GLOO"] = "0"
             role = role_maker.PaddleCloudRoleMaker(
                 is_collective=False,
                 init_gloo=False