Initialise the process group for tensor parallelism (TP)
This commit is contained in:
@@ -827,7 +827,7 @@ class ModelLoader:
|
|||||||
_ = _configure_zero3_memory_efficient_loading()
|
_ = _configure_zero3_memory_efficient_loading()
|
||||||
|
|
||||||
if self.cfg.tensor_parallel == "auto":
|
if self.cfg.tensor_parallel == "auto":
|
||||||
rank = int(os.environ["RANK"])
|
rank = int(os.environ.get("LOCAL_RANK", 0))
|
||||||
device = torch.device(f"cuda:{rank}")
|
device = torch.device(f"cuda:{rank}")
|
||||||
torch.distributed.init_process_group("nccl", device_id=device)
|
torch.distributed.init_process_group("nccl", device_id=device)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user