Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

kd_ema_test.py 4.7 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
  1. import unittest
  2. from super_gradients.training import models
  3. from super_gradients.training import Trainer
  4. from super_gradients.training.dataloaders.dataloaders import classification_test_dataloader
  5. from super_gradients.training.kd_trainer import KDTrainer
  6. import torch
  7. from super_gradients.training.utils.utils import check_models_have_same_weights
  8. from super_gradients.training.metrics import Accuracy
  9. from super_gradients.training.losses.kd_losses import KDLogitsLoss
  10. class KDEMATest(unittest.TestCase):
  11. @classmethod
  12. def setUp(cls):
  13. cls.sg_trained_teacher = Trainer("sg_trained_teacher", device='cpu')
  14. cls.kd_train_params = {"max_epochs": 3, "lr_updates": [1], "lr_decay_factor": 0.1, "lr_mode": "step",
  15. "lr_warmup_epochs": 0, "initial_lr": 0.1,
  16. "loss": KDLogitsLoss(torch.nn.CrossEntropyLoss()),
  17. "optimizer": "SGD",
  18. "criterion_params": {}, "optimizer_params": {"weight_decay": 1e-4, "momentum": 0.9},
  19. "train_metrics_list": [Accuracy()], "valid_metrics_list": [Accuracy()],
  20. "metric_to_watch": "Accuracy",
  21. 'loss_logging_items_names': ["Loss", "Task Loss", "Distillation Loss"],
  22. "greater_metric_to_watch_is_better": True, "average_best_models": False,
  23. "ema": True}
  24. def test_teacher_ema_not_duplicated(self):
  25. """Check that the teacher EMA is a reference to the teacher net (not a copy)."""
  26. kd_model = KDTrainer("test_teacher_ema_not_duplicated", device='cpu')
  27. student = models.get('resnet18', arch_params={'num_classes': 1000})
  28. teacher = models.get('resnet50', arch_params={'num_classes': 1000},
  29. pretrained_weights="imagenet")
  30. kd_model.train(training_params=self.kd_train_params, student=student, teacher=teacher,
  31. train_loader=classification_test_dataloader(),
  32. valid_loader=classification_test_dataloader())
  33. self.assertTrue(kd_model.ema_model.ema.module.teacher is kd_model.net.module.teacher)
  34. self.assertTrue(kd_model.ema_model.ema.module.student is not kd_model.net.module.student)
  35. def test_kd_ckpt_reload_net(self):
  36. """Check that the KD trainer load correctly from checkpoint when "load_ema_as_net=False"."""
  37. # Create a KD trainer and train it
  38. train_params = self.kd_train_params.copy()
  39. kd_model = KDTrainer("test_kd_ema_ckpt_reload", device='cpu')
  40. student = models.get('resnet18', arch_params={'num_classes': 1000})
  41. teacher = models.get('resnet50', arch_params={'num_classes': 1000},
  42. pretrained_weights="imagenet")
  43. kd_model.train(training_params=self.kd_train_params, student=student, teacher=teacher,
  44. train_loader=classification_test_dataloader(),
  45. valid_loader=classification_test_dataloader())
  46. ema_model = kd_model.ema_model.ema
  47. net = kd_model.net
  48. # Load the trained KD trainer
  49. kd_model = KDTrainer("test_kd_ema_ckpt_reload", device='cpu')
  50. student = models.get('resnet18', arch_params={'num_classes': 1000})
  51. teacher = models.get('resnet50', arch_params={'num_classes': 1000},
  52. pretrained_weights="imagenet")
  53. train_params["resume"] = True
  54. kd_model.train(training_params=train_params, student=student, teacher=teacher,
  55. train_loader=classification_test_dataloader(),
  56. valid_loader=classification_test_dataloader())
  57. reloaded_ema_model = kd_model.ema_model.ema
  58. reloaded_net = kd_model.net
  59. # trained ema == loaded ema (Should always be true as long as "ema=True" in train_params)
  60. self.assertTrue(check_models_have_same_weights(ema_model, reloaded_ema_model))
  61. # loaded net == trained net (since load_ema_as_net = False)
  62. self.assertTrue(check_models_have_same_weights(reloaded_net, net))
  63. # loaded net != trained ema (since load_ema_as_net = False)
  64. self.assertTrue(not check_models_have_same_weights(reloaded_net, ema_model))
  65. # loaded student ema == loaded student net (since load_ema_as_net = False)
  66. self.assertTrue(
  67. not check_models_have_same_weights(reloaded_ema_model.module.student, reloaded_net.module.student))
  68. # loaded teacher ema == loaded teacher net (teacher always loads ema)
  69. self.assertTrue(check_models_have_same_weights(reloaded_ema_model.module.teacher, reloaded_net.module.teacher))
  70. if __name__ == '__main__':
  71. unittest.main()
Tip!

Press p to see the previous file, or n to see the next file

Comments

Loading...