@@ -357,6 +357,8 @@ def test(self, zero_stage, use_cpu_offload):
357
357
model .backward (loss )
358
358
model .step ()
359
359
360
+ model .destroy ()
361
+
360
362
361
363
@pytest .mark .parametrize ("zero_stage" , [1 , 2 , 3 ])
362
364
@pytest .mark .parametrize ("use_cpu_offload" , [True , False ])
@@ -402,6 +404,8 @@ def test(self, zero_stage, use_cpu_offload, hidden_dim=4):
402
404
model .backward (loss )
403
405
model .step ()
404
406
407
+ model .destroy ()
408
+
405
409
406
410
@pytest .mark .parametrize ("zero_stage" , [1 , 2 , 3 ])
407
411
@pytest .mark .parametrize ("use_cpu_offload" , [True , False ])
@@ -436,6 +440,7 @@ def test(self, zero_stage, use_cpu_offload):
436
440
model = model ,
437
441
optimizer = optimizer ,
438
442
model_parameters = model .parameters ())
443
+ model .destroy ()
439
444
440
445
441
446
@pytest .mark .parametrize ("zero_stage" , [1 , 2 , 3 ])
@@ -486,6 +491,8 @@ def test(self, zero_stage, use_cpu_offload):
486
491
model .backward (loss )
487
492
model .step ()
488
493
494
+ model .destroy ()
495
+
489
496
490
497
@amp_available
491
498
class TestAmp (DistributedTest ):
@@ -615,6 +622,7 @@ def test(self, zero_stage, optimizer_constructor):
615
622
model = SimpleModel (hidden_dim )
616
623
client_optimizer = optimizer_constructor (params = model .parameters ())
617
624
model , _ , _ , _ = deepspeed .initialize (config = config_dict , model = model , optimizer = client_optimizer )
625
+ model .destroy ()
618
626
619
627
620
628
class TestZero2ReduceScatterOff (DistributedTest ):
@@ -727,6 +735,8 @@ def test(self):
727
735
model .backward (loss )
728
736
model .step ()
729
737
738
+ model .destroy ()
739
+
730
740
731
741
@pytest .mark .parametrize ('stage' , [1 , 2 , 3 ])
732
742
class TestZeroEmptyGrad (DistributedTest ):
@@ -755,3 +765,5 @@ def test(self, stage):
755
765
loss = model (batch [0 ], batch [1 ])
756
766
model .backward (loss )
757
767
model .step ()
768
+
769
+ model .destroy ()
0 commit comments