#211 SG-136: Apply ema only on student (KD)

Merged

Louis Dupont merged 1 commit into Deci-AI:master from deci-ai:feature/SG-136_use_ema_only_on_kd_student

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

          
            # Shelfnet34_lw recipe for COCO segmentation 21 classes from PASCAL.
# Reaches ~65.1 mIOU
# Trained on 4 x 2080 Ti GPUs using DDP; takes ~2d 7h with a batch size of 8 and batch accumulation of 3 (i.e. the
# effective batch size is 4*8*3 = 96).
# Logs and tensorboards: s3://deci-pretrained-models/shelfnet34_coco_segmentation_tensorboard/
# python train_from_recipe_example/train_from_recipe.py --config-name=coco_segmentation_shelfnet_lw
# Defaults list: each entry selects a named option for a config group
# (training hyper-parameters, dataset, architecture and checkpoint settings).
defaults:
  - training_hyperparams: coco_segmentation_shelfnet_lw_train_params
  - dataset_params: coco_segmentation_dataset_params
  - arch_params: shelfnet34_lw_arch_params
  - checkpoint_params: default_checkpoint_params

# `_target_` names the object that supplies the class-inclusion tuples;
# the result is consumed below through `${sub_classes}`.
sub_classes:
  _target_: super_gradients.training.utils.segmentation_utils.coco_sub_classes_inclusion_tuples_list

# Dataset interface, wired to the selected `dataset_params` and to the
# sub-class list declared above.
dataset_interface:
  _target_: super_gradients.training.datasets.dataset_interfaces.dataset_interface.CoCoSegmentationDatasetInterface
  dataset_params: ${dataset_params}
  dataset_classes_inclusion_tuples_list: ${sub_classes}

data_loader_num_workers: 8

# Single top-level switch; interpolated into `checkpoint_params.load_checkpoint`.
load_checkpoint: true

# Checkpoint settings declared in this recipe.
# NOTE(review): presumably these are merged over the `default_checkpoint_params`
# option selected in `defaults` - confirm against the config loader.
checkpoint_params:
  load_checkpoint: ${load_checkpoint}
  strict_load: true
  load_weights_only: true
  load_backbone: true
  source_ckpt_folder_name: resnet_34

experiment_name: coco_segmentation_21_subclass_shelfnet34

multi_gpu:
  _target_: super_gradients.training.sg_model.MultiGPUMode
  value: 'DDP'

# Explicit null: no checkpoint root directory is set by this recipe.
ckpt_root_dir: null

# Model wrapper; every argument except `_target_` is an interpolation of a
# top-level key.
sg_model:
  _target_: super_gradients.SgModel
  experiment_name: ${experiment_name}
  # NOTE(review): `model_checkpoints_location` is not defined in the visible
  # part of this file - confirm it is provided elsewhere, otherwise this
  # interpolation cannot be resolved.
  model_checkpoints_location: ${model_checkpoints_location}
  ckpt_root_dir: ${ckpt_root_dir}
  multi_gpu: ${multi_gpu}

architecture: shelfnet34_lw

          
        
      

  

Tip!

Press p to see the previous file, or n to see the next file.

Deci-AI / super-gradients connected to https://github.com/Deci-AI/super-gradients.git

#211 SG-136: Apply ema only on student (KD)

Deci-AI
/
super-gradients
connected to https://github.com/Deci-AI/super-gradients.git