#211 SG-136: Apply ema only on student (KD)

Merged

Louis Dupont merged 1 commit into Deci-AI:master from deci-ai:feature/SG-136_use_ema_only_on_kd_student

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

          
# EfficientNet-B0 ImageNet training
# This example trains with effective batch size = 64 * 4 gpus = 256.
# Epoch time on 4 X 3090Ti distributed training is ~ 16:25 minutes
# Logs and tensorboards: s3://deci-pretrained-models/efficientnet_b0/
# Instructions:
# Set the PYTHONPATH environment variable: (Replace "YOUR_LOCAL_PATH" with the path to the downloaded repo):
#   export PYTHONPATH="YOUR_LOCAL_PATH"/super_gradients/:"YOUR_LOCAL_PATH"/super_gradients/src/
# Then:
#   python -m torch.distributed.launch --nproc_per_node=4 train_from_recipe.py --config-name=imagenet_efficientnet
# Config groups this recipe is composed from. The sections below set
# recipe-specific values under the same group names (exact merge order
# depends on the Hydra version in use -- TODO confirm).
defaults:
  - training_hyperparams: imagenet_efficientnet_train_params
  - dataset_params: imagenet_dataset_params
  - arch_params: efficientnet_b0_arch_params
  - checkpoint_params: default_checkpoint_params

arch_params:
  num_classes: 1000

dataset_params:
  # Per-process batch size; with 4 GPUs the effective batch size is 256.
  batch_size: 64
  color_jitter: 0.4
  random_erase_prob: 0.2
  random_erase_value: random
  train_interpolation: random
  auto_augment_config_string: rand-m9-mstd0.5

# Object built from `_target_`; it receives the dataset_params defined above
# through interpolation.
dataset_interface:
  _target_: super_gradients.training.datasets.dataset_interfaces.dataset_interface.ImageNetDatasetInterface
  dataset_params: ${dataset_params}
  data_dir: /data/Imagenet

data_loader_num_workers: 8

# Single top-level switch, forwarded into checkpoint_params below.
load_checkpoint: false

checkpoint_params:
  load_checkpoint: ${load_checkpoint}

experiment_name: efficientnet_b0_imagenet

model_checkpoints_location: local

# Explicit null (previously a bare empty value, which also loads as null).
ckpt_root_dir: null

multi_gpu:
  _target_: super_gradients.training.sg_model.MultiGPUMode
  value: 'DDP'

# Object built from `_target_`; every argument is interpolated from the
# top-level keys of the same name defined above.
sg_model:
  _target_: super_gradients.SgModel
  experiment_name: ${experiment_name}
  model_checkpoints_location: ${model_checkpoints_location}
  ckpt_root_dir: ${ckpt_root_dir}
  multi_gpu: ${multi_gpu}

architecture: efficientnet_b0

          
        
      

  

Tip!

Press p to see the previous file, or n to see the next file.

Deci-AI / super-gradients connected to https://github.com/Deci-AI/super-gradients.git

#211 SG-136: Apply ema only on student (KD)

Deci-AI
/
super-gradients
connected to https://github.com/Deci-AI/super-gradients.git