Skip to content

Commit 8952443

Browse files
committed
upload everything
1 parent f2e462a commit 8952443

File tree

14 files changed

+2215
-1
lines changed

14 files changed

+2215
-1
lines changed

README.md

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,17 @@
1212
Please download the dataset through this [link](https://drive.google.com/file/d/19jRx9WjLviCGpqa_ShXVSnGG0rfr2GeV/view?usp=sharing
1313
).
1414

15-
### Code will be available early October.
15+
### Training
16+
After downloading the dataset and extracting the I3D features using this [**repo**](https://github.com/Tushar-N/pytorch-resnet3d), simply run the following command:
17+
```shell
18+
python main_transformer.py
19+
```
1620

21+
### Inference
22+
For inference, set the path of the best checkpoint, then run the following command:
23+
```shell
24+
python inference.py
25+
```
1726

1827
### Citation
1928

comm.py

Lines changed: 132 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,132 @@
1+
import pickle
2+
import torch
3+
import torch.distributed as dist
4+
5+
6+
class Comm(object):
    """Lightweight view of torch.distributed process-group state.

    Every accessor degrades gracefully to single-process values
    (world size 1, rank 0) when torch.distributed is unavailable or
    has not been initialized, so the same code path works for both
    single-GPU and distributed runs.
    """

    def __init__(self, local_rank=0):
        # BUG FIX: the original ignored the argument and always stored 0;
        # store the caller-supplied local rank instead.
        self.local_rank = local_rank

    @property
    def world_size(self):
        """Number of processes in the group (1 when not distributed)."""
        if not dist.is_available():
            return 1
        if not dist.is_initialized():
            return 1
        return dist.get_world_size()

    @property
    def rank(self):
        """Global rank of this process (0 when not distributed)."""
        if not dist.is_available():
            return 0
        if not dist.is_initialized():
            return 0
        return dist.get_rank()

    @property
    def local_rank(self):
        """Rank of this process on its node (0 when not distributed)."""
        if not dist.is_available():
            return 0
        if not dist.is_initialized():
            return 0
        return self._local_rank

    @local_rank.setter
    def local_rank(self, value):
        # BUG FIX: the original guards fell through, so the forced 0 was
        # immediately overwritten by `value`; return early instead.
        if not dist.is_available() or not dist.is_initialized():
            self._local_rank = 0
            return
        self._local_rank = value

    @property
    def head(self):
        """Log prefix identifying this process, e.g. 'Rank[0/1]'."""
        return 'Rank[{}/{}]'.format(self.rank, self.world_size)

    def is_main_process(self):
        """Return True only on global rank 0."""
        return self.rank == 0

    def synchronize(self):
        """
        Helper function to synchronize (barrier) among all processes when
        using distributed training
        """
        if self.world_size == 1:
            return
        dist.barrier()


# Module-level singleton used by the rest of the project.
comm = Comm()
60+
61+
62+
def all_gather(data):
    """
    Run all_gather on arbitrary picklable data (not necessarily tensors)
    Args:
        data: any picklable object
    Returns:
        list[data]: list of data gathered from each rank
    """
    num_ranks = comm.world_size
    if num_ranks == 1:
        return [data]

    # Serialize the payload into a CUDA byte tensor.
    serialized = pickle.dumps(data)
    storage = torch.ByteStorage.from_buffer(serialized)
    payload = torch.ByteTensor(storage).to("cuda")

    # Exchange payload sizes so every rank learns the maximum.
    local_size = torch.LongTensor([payload.numel()]).to("cuda")
    size_list = [torch.LongTensor([0]).to("cuda") for _ in range(num_ranks)]
    dist.all_gather(size_list, local_size)
    size_list = [int(s.item()) for s in size_list]
    max_size = max(size_list)

    # torch's all_gather requires equal shapes, so pad every payload
    # up to max_size before gathering.
    gathered = [torch.ByteTensor(size=(max_size,)).to("cuda") for _ in size_list]
    if local_size != max_size:
        pad = torch.ByteTensor(size=(max_size - local_size,)).to("cuda")
        payload = torch.cat((payload, pad), dim=0)
    dist.all_gather(gathered, payload)

    # Strip the padding and deserialize each rank's object.
    results = []
    for length, chunk in zip(size_list, gathered):
        raw = chunk.cpu().numpy().tobytes()[:length]
        results.append(pickle.loads(raw))

    return results
103+
104+
105+
def reduce_dict(input_dict, average=True):
    """
    Args:
        input_dict (dict): all the values will be reduced
        average (bool): whether to do average or sum
    Reduce the values in the dictionary from all processes so that process with rank
    0 has the averaged results. Returns a dict with the same fields as
    input_dict, after reduction.
    """
    world_size = comm.world_size
    if world_size < 2:
        return input_dict
    with torch.no_grad():
        # Sort keys so every process stacks the values in the same order.
        keys = sorted(input_dict.keys())
        stacked = torch.stack([input_dict[k] for k in keys], dim=0)
        dist.reduce(stacked, dst=0)
        if average and dist.get_rank() == 0:
            # Only the main process holds the accumulated sum, so only
            # it divides by world_size.
            stacked /= world_size
        return dict(zip(keys, stacked))
132+

config.py

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
import numpy as np
2+
import os
3+
4+
class Config(object):
    """Run configuration derived from parsed command-line arguments."""

    def __init__(self, args):
        # NOTE(review): eval() on a CLI string executes arbitrary code;
        # consider ast.literal_eval if plain literals suffice.
        self.lr = eval(args.lr)
        # Keep the raw string form for logging / reproducibility.
        self.lr_str = args.lr

    def __str__(self):
        """Render every attribute except the evaluated `lr` as '- name: value' lines."""
        fields = vars(self)
        lines = ["- %s: %s" % (name, fields[name])
                 for name in sorted(fields.keys()) if name != 'lr']
        return '\n'.join(lines)
13+

config_cvt.py

Lines changed: 207 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,207 @@
1+
from __future__ import absolute_import
2+
from __future__ import division
3+
from __future__ import print_function
4+
5+
import os.path as op
6+
import yaml
7+
from yacs.config import CfgNode as CN
8+
9+
from comm import comm
10+
11+
12+
# Default configuration tree (yacs). Values here are overridden by the
# YAML file and CLI options via update_config() below.
_C = CN()

# general / runtime options
_C.BASE = ['']
_C.NAME = ''
_C.DATA_DIR = ''
_C.DIST_BACKEND = 'nccl'
_C.GPUS = (0,)
# _C.LOG_DIR = ''
_C.MULTIPROCESSING_DISTRIBUTED = True
_C.OUTPUT_DIR = ''
_C.PIN_MEMORY = True
_C.PRINT_FREQ = 20
_C.RANK = 0
_C.VERBOSE = True
_C.WORKERS = 4
_C.MODEL_SUMMARY = False

# automatic mixed precision
_C.AMP = CN()
_C.AMP.ENABLED = False
_C.AMP.MEMORY_FORMAT = 'nchw'

# Cudnn related params
_C.CUDNN = CN()
_C.CUDNN.BENCHMARK = True
_C.CUDNN.DETERMINISTIC = False
_C.CUDNN.ENABLED = True

# common params for NETWORK
_C.MODEL = CN()
_C.MODEL.NAME = 'cls_hrnet'
_C.MODEL.INIT_WEIGHTS = True
_C.MODEL.PRETRAINED = ''
_C.MODEL.PRETRAINED_LAYERS = ['*']
_C.MODEL.NUM_CLASSES = 1000
_C.MODEL.SPEC = CN(new_allowed=True)


# loss
_C.LOSS = CN(new_allowed=True)
_C.LOSS.LABEL_SMOOTHING = 0.0
_C.LOSS.LOSS = 'softmax'

# DATASET related params
_C.DATASET = CN()
_C.DATASET.ROOT = ''
_C.DATASET.DATASET = 'imagenet'
_C.DATASET.TRAIN_SET = 'train'
_C.DATASET.TEST_SET = 'val'
_C.DATASET.DATA_FORMAT = 'jpg'
_C.DATASET.LABELMAP = ''
_C.DATASET.TRAIN_TSV_LIST = []
_C.DATASET.TEST_TSV_LIST = []
_C.DATASET.SAMPLER = 'default'

_C.DATASET.TARGET_SIZE = -1

# training data augmentation
_C.INPUT = CN()
_C.INPUT.MEAN = [0.485, 0.456, 0.406]
_C.INPUT.STD = [0.229, 0.224, 0.225]

# data augmentation
_C.AUG = CN()
_C.AUG.SCALE = (0.08, 1.0)
_C.AUG.RATIO = (3.0/4.0, 4.0/3.0)
_C.AUG.COLOR_JITTER = [0.4, 0.4, 0.4, 0.1, 0.0]
_C.AUG.GRAY_SCALE = 0.0
_C.AUG.GAUSSIAN_BLUR = 0.0
_C.AUG.DROPBLOCK_LAYERS = [3, 4]
_C.AUG.DROPBLOCK_KEEP_PROB = 1.0
_C.AUG.DROPBLOCK_BLOCK_SIZE = 7
_C.AUG.MIXUP_PROB = 0.0
_C.AUG.MIXUP = 0.0
_C.AUG.MIXCUT = 0.0
_C.AUG.MIXCUT_MINMAX = []
_C.AUG.MIXUP_SWITCH_PROB = 0.5
_C.AUG.MIXUP_MODE = 'batch'
_C.AUG.MIXCUT_AND_MIXUP = False
_C.AUG.INTERPOLATION = 2
_C.AUG.TIMM_AUG = CN(new_allowed=True)
_C.AUG.TIMM_AUG.USE_LOADER = False
_C.AUG.TIMM_AUG.USE_TRANSFORM = False

# train
_C.TRAIN = CN()

_C.TRAIN.AUTO_RESUME = True
_C.TRAIN.CHECKPOINT = ''
_C.TRAIN.LR_SCHEDULER = CN(new_allowed=True)
# SCALE_LR multiplies TRAIN.LR by the world size in update_config().
_C.TRAIN.SCALE_LR = True
_C.TRAIN.LR = 0.001

_C.TRAIN.OPTIMIZER = 'sgd'
_C.TRAIN.OPTIMIZER_ARGS = CN(new_allowed=True)
_C.TRAIN.MOMENTUM = 0.9
_C.TRAIN.WD = 0.0001
_C.TRAIN.WITHOUT_WD_LIST = []
_C.TRAIN.NESTEROV = True
# for adam
_C.TRAIN.GAMMA1 = 0.99
_C.TRAIN.GAMMA2 = 0.0

_C.TRAIN.BEGIN_EPOCH = 0
_C.TRAIN.END_EPOCH = 100

_C.TRAIN.IMAGE_SIZE = [224, 224]  # width * height, ex: 192 * 256
_C.TRAIN.BATCH_SIZE_PER_GPU = 32
_C.TRAIN.SHUFFLE = True

_C.TRAIN.EVAL_BEGIN_EPOCH = 0

_C.TRAIN.DETECT_ANOMALY = False

_C.TRAIN.CLIP_GRAD_NORM = 0.0
_C.TRAIN.SAVE_ALL_MODELS = False

# testing
_C.TEST = CN()

# size of images for each device
_C.TEST.BATCH_SIZE_PER_GPU = 32
_C.TEST.CENTER_CROP = True
_C.TEST.IMAGE_SIZE = [224, 224]  # width * height, ex: 192 * 256
_C.TEST.INTERPOLATION = 2
_C.TEST.MODEL_FILE = ''
_C.TEST.REAL_LABELS = False
_C.TEST.VALID_LABELS = ''

# fine-tuning from a pretrained checkpoint
_C.FINETUNE = CN()
_C.FINETUNE.FINETUNE = False
_C.FINETUNE.USE_TRAIN_AUG = False
_C.FINETUNE.BASE_LR = 0.003
_C.FINETUNE.BATCH_SIZE = 512
_C.FINETUNE.EVAL_EVERY = 3000
_C.FINETUNE.TRAIN_MODE = True
# _C.FINETUNE.MODEL_FILE = ''
_C.FINETUNE.FROZEN_LAYERS = []
_C.FINETUNE.LR_SCHEDULER = CN(new_allowed=True)
_C.FINETUNE.LR_SCHEDULER.DECAY_TYPE = 'step'

# debug
_C.DEBUG = CN()
_C.DEBUG.DEBUG = False
157+
158+
159+
def _update_config_from_file(config, cfg_file):
    """Recursively merge a YAML config file (and its BASE parents) into config.

    Parent files listed under the 'BASE' key are merged first, so the
    child file's own values override them.
    """
    config.defrost()
    with open(cfg_file, 'r') as f:
        yaml_cfg = yaml.load(f, Loader=yaml.FullLoader)

    for base in yaml_cfg.setdefault('BASE', ['']):
        if base:
            # BASE paths are relative to the current config file.
            _update_config_from_file(config, op.join(op.dirname(cfg_file), base))
    print('=> merge config from {}'.format(cfg_file))
    config.merge_from_file(cfg_file)
    config.freeze()
172+
173+
174+
def update_config(config, args):
    """Finalize config: merge the YAML file from args.cfg, then CLI overrides.

    Also scales the learning rate by the world size when TRAIN.SCALE_LR
    is set, prefixes NAME with the config file's basename, records the
    rank, and propagates shared values into the timm sub-configs.
    """
    _update_config_from_file(config, args.cfg)

    config.defrost()
    config.merge_from_list(args.opts)

    # Linear LR scaling rule across distributed workers.
    if config.TRAIN.SCALE_LR:
        config.TRAIN.LR *= comm.world_size

    stem, _ = op.splitext(op.basename(args.cfg))
    config.NAME = stem + config.NAME
    config.RANK = comm.rank

    # Propagate shared values into the timm-specific sub-configs.
    if config.TRAIN.LR_SCHEDULER.METHOD == 'timm':
        config.TRAIN.LR_SCHEDULER.ARGS.epochs = config.TRAIN.END_EPOCH
    if config.TRAIN.OPTIMIZER == 'timm':
        config.TRAIN.OPTIMIZER_ARGS.lr = config.TRAIN.LR

    # Any mixup/cutmix option implies the mixup transform must fire.
    aug_cfg = config.AUG
    if aug_cfg.MIXUP > 0.0 or aug_cfg.MIXCUT > 0.0 or aug_cfg.MIXCUT_MINMAX:
        aug_cfg.MIXUP_PROB = 1.0

    config.freeze()
195+
196+
197+
def save_config(cfg, path):
    """Write the serialized config to *path*; only rank 0 writes."""
    if not comm.is_main_process():
        return
    with open(path, 'w') as f:
        f.write(cfg.dump())
201+
202+
203+
if __name__ == '__main__':
    # Dump the default configuration to the file named on the command line.
    import sys

    with open(sys.argv[1], 'w') as out:
        print(_C, file=out)
207+

0 commit comments

Comments
 (0)