Skip to content

Commit

Permalink
Merge pull request #244 from sony/feature/20200921-extend-watchdog-time
Browse files Browse the repository at this point in the history
Extend the watchdog timeout so that it is not overly sensitive
  • Loading branch information
YukioOobuchi authored Sep 29, 2020
2 parents cf53048 + 85bf3f6 commit cf74f5e
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -60,7 +60,7 @@ template <typename T>
class NBLA_API MultiProcessDataParallelCommunicatorNccl
: public MultiProcessDataParallelCommunicator<T> {
protected:
- int all_reduce_timeout_ = 100; // timeout=10s
+ int all_reduce_timeout_ = 500; // timeout=50s
Watchdog watch_dog_;
int device_id_;

Expand Down
2 changes: 1 addition & 1 deletion include/nbla/cuda/communicator/watch_dog.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ namespace nbla {

class Watchdog {
private:
- static const int TIMEOUT_TICKS = 100; // default timeout is 10s
+ static const int TIMEOUT_TICKS = 600; // default timeout is 60s
static const int TICK = 100; // 100 ms each tick
static const int STOP_WATCH_DOG = -1000; // arbitrary negative value
static const int EXIT_WATCH_DOG = 1; // exit flag
Expand Down

0 comments on commit cf74f5e

Please sign in to comment.