From f512d9f8ebe03dd0842fba88b12a7a44e14282be Mon Sep 17 00:00:00 2001 From: Yasiru Date: Sun, 28 Apr 2024 00:30:57 +1000 Subject: [PATCH 1/3] Changed argument --local_rank to --local-rank The argument --local_rank has been changed to --local-rank because torch.distributed.launch passes the argument as --local-rank instead of --local_rank in a multi-GPU environment. --- train.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/train.py b/train.py index 59c372afe..a114f93f3 100644 --- a/train.py +++ b/train.py @@ -466,7 +466,7 @@ def parse_opt(known=False): parser.add_argument('--freeze', nargs='+', type=int, default=[0], help='Freeze layers: backbone=10, first3=0 1 2') parser.add_argument('--save-period', type=int, default=-1, help='Save checkpoint every x epochs (disabled if < 1)') parser.add_argument('--seed', type=int, default=0, help='Global training seed') - parser.add_argument('--local_rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') + parser.add_argument('--local-rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') parser.add_argument('--min-items', type=int, default=0, help='Experimental') parser.add_argument('--close-mosaic', type=int, default=0, help='Experimental') From 9d3041f6ffde5aa301a3c7e8e59ce61cff107b5b Mon Sep 17 00:00:00 2001 From: Yasiru Date: Sun, 28 Apr 2024 00:32:12 +1000 Subject: [PATCH 2/3] Changed argument --local_rank to --local-rank The argument --local_rank has been changed to --local-rank because torch.distributed.launch passes the argument as --local-rank instead of --local_rank in a multi-GPU environment. 
--- train_dual.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/train_dual.py b/train_dual.py index 1d21ac8f5..69964fe98 100644 --- a/train_dual.py +++ b/train_dual.py @@ -474,7 +474,7 @@ def parse_opt(known=False): parser.add_argument('--freeze', nargs='+', type=int, default=[0], help='Freeze layers: backbone=10, first3=0 1 2') parser.add_argument('--save-period', type=int, default=-1, help='Save checkpoint every x epochs (disabled if < 1)') parser.add_argument('--seed', type=int, default=0, help='Global training seed') - parser.add_argument('--local_rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') + parser.add_argument('--local-rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') parser.add_argument('--min-items', type=int, default=0, help='Experimental') parser.add_argument('--close-mosaic', type=int, default=0, help='Experimental') From 5864f5422abee4570c299fc19ef3e2c25ef18785 Mon Sep 17 00:00:00 2001 From: Yasiru Date: Sun, 28 Apr 2024 00:32:52 +1000 Subject: [PATCH 3/3] Changed argument --local_rank to --local-rank The argument --local_rank has been changed to --local-rank because torch.distributed.launch passes the argument as --local-rank instead of --local_rank in a multi-GPU environment. 
--- train_triple.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/train_triple.py b/train_triple.py index 4dbbc1eee..f824d189b 100644 --- a/train_triple.py +++ b/train_triple.py @@ -466,7 +466,7 @@ def parse_opt(known=False): parser.add_argument('--freeze', nargs='+', type=int, default=[0], help='Freeze layers: backbone=10, first3=0 1 2') parser.add_argument('--save-period', type=int, default=-1, help='Save checkpoint every x epochs (disabled if < 1)') parser.add_argument('--seed', type=int, default=0, help='Global training seed') - parser.add_argument('--local_rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') + parser.add_argument('--local-rank', type=int, default=-1, help='Automatic DDP Multi-GPU argument, do not modify') parser.add_argument('--min-items', type=int, default=0, help='Experimental') parser.add_argument('--close-mosaic', type=int, default=0, help='Experimental')