mirror of
https://github.com/THU-MIG/yolov10.git
synced 2025-05-23 21:44:22 +08:00
re-added commented out debug print
This commit is contained in:
parent
99b3fac964
commit
803f4013a2
@@ -224,6 +224,7 @@ class BaseTrainer:
|
|||||||
"""Initializes and sets the DistributedDataParallel parameters for training."""
|
"""Initializes and sets the DistributedDataParallel parameters for training."""
|
||||||
torch.cuda.set_device(RANK)
|
torch.cuda.set_device(RANK)
|
||||||
self.device = torch.device("cuda", RANK)
|
self.device = torch.device("cuda", RANK)
|
||||||
|
# LOGGER.info(f'DDP info: RANK {RANK}, WORLD_SIZE {world_size}, DEVICE {self.device}')
|
||||||
os.environ["TORCH_NCCL_BLOCKING_WAIT"] = "1" # set to enforce timeout
|
os.environ["TORCH_NCCL_BLOCKING_WAIT"] = "1" # set to enforce timeout
|
||||||
dist.init_process_group(
|
dist.init_process_group(
|
||||||
backend="nccl" if dist.is_nccl_available() else "gloo",
|
backend="nccl" if dist.is_nccl_available() else "gloo",
|
||||||
|
Loading…
x
Reference in New Issue
Block a user