We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 79d8bd1, commit e53cda0 (Copy full SHA for e53cda0)
scripts/vla/vla_finetune.py
@@ -54,7 +54,7 @@
54
def main(args) -> None:
55
56
mbs = args.mbs
57
- gbs = args.mbs *2
+ gbs = args.mbs
58
decoder_seq_length = 287
59
60
@@ -94,7 +94,7 @@ def main(args) -> None:
94
)
95
96
strategy = nl.MegatronStrategy(
97
- tensor_model_parallel_size=4,
+ tensor_model_parallel_size=2,
98
pipeline_model_parallel_size=1,
99
pipeline_dtype=torch.bfloat16,
100
sequence_parallel=False,
0 commit comments