Renaming files

manogna-s · Jun 15, 2021 · 305af27
1 parent dcdbf42
commit 305af27
Show file tree

Hide file tree

Showing 8 changed files with 57 additions and 238 deletions.
diff --git a/models/model_utils.py b/models/model_utils.py
diff --git a/models/modeling.py b/models/model_vit.py
@@ -19,12 +19,11 @@
 import gin
 import models.configs as configs
 
-from .modeling_resnet import ResNetV2
+from .resnetv2 import ResNetV2
 
 
 logger = logging.getLogger(__name__)
 
-
 ATTENTION_Q = "MultiHeadDotProductAttention_1/query"
 ATTENTION_K = "MultiHeadDotProductAttention_1/key"
 ATTENTION_V = "MultiHeadDotProductAttention_1/value"

diff --git a/models/modeling_resnet.py b/models/resnetv2.py
@@ -151,7 +151,7 @@ def __init__(self, block_units, width_factor):
             ('block2', nn.Sequential(OrderedDict(
                 [('unit1', PreActBottleneck(cin=width*4, cout=width*8, cmid=width*2, stride=2))] +
                 [(f'unit{i:d}', PreActBottleneck(cin=width*8, cout=width*8, cmid=width*2)) for i in range(2, block_units[1] + 1)],
-                ))),    
+                ))),
             ('block3', nn.Sequential(OrderedDict(
                 [('unit1', PreActBottleneck(cin=width*8, cout=width*16, cmid=width*4, stride=2))] +
                 [(f'unit{i:d}', PreActBottleneck(cin=width*16, cout=width*16, cmid=width*4)) for i in range(2, block_units[2] + 1)],
@@ -161,4 +161,4 @@ def __init__(self, block_units, width_factor):
     def forward(self, x):
         x = self.root(x)
         x = self.body(x)
-        return x
+        return x
diff --git a/models/sur.py b/models/sur.py
@@ -1,10 +1,10 @@
 import torch
+from torch import nn
 import numpy as np
-
-from models.model_utils import sigmoid, cosine_sim
 from models.losses import prototype_loss
-device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
 
+device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+sigmoid = nn.Sigmoid()
 
 def apply_selection(features_dict, lambdas, normalize=True):
     """

diff --git a/paths.py b/paths.py
@@ -0,0 +1,3 @@
+PROJECT_ROOT = './'
+META_DATASET_ROOT = 'cdfsl_dataset/meta_dataset'
+META_RECORDS_ROOT = 'cdfsl_dataset/meta_dataset/dataset_conversion/records'
diff --git a/train.py b/train.py
@@ -13,10 +13,10 @@
 import json
 from tqdm import tqdm
 from torch.utils.tensorboard import SummaryWriter
-# from apex import amp
-# from apex.parallel import DistributedDataParallel as DDP
+from apex import amp
+from apex.parallel import DistributedDataParallel as DDP
 
-from models.modeling import VisionTransformer, CONFIGS
+from models.model_vit import VisionTransformer, CONFIGS
 from utils.scheduler import WarmupLinearSchedule, WarmupCosineSchedule
 from utils.data_utils import get_loader
 
@@ -25,6 +25,7 @@
 
 class AverageMeter(object):
     """Computes and stores the average and current value"""
+
     def __init__(self):
         self.reset()
 
@@ -49,14 +50,15 @@ def save_model(args, model):
     model_to_save = model.module if hasattr(model, 'module') else model
     model_checkpoint = os.path.join(args.output_dir, "checkpoint.bin")
     torch.save(model_to_save.state_dict(), model_checkpoint)
-    model_config = {'img_size': 84, 'num_classes':47, 'model_type': "ViT-B_16", 'dataset':args.dataset,'weights_file': model_checkpoint}
+    model_config = {'img_size': 84, 'num_classes': 47, 'model_type': "ViT-B_16", 'dataset': args.dataset,
+                    'weights_file': model_checkpoint}
     with open(os.path.join(args.output_dir, "model_config.json"), "w") as outfile:
         json.dump(model_config, outfile)
     logger.info("Saved model checkpoint to [DIR: %s]", args.output_dir)
 
 
 @gin.configurable
-def get_model(args, img_size, num_classes, model_type, pretrained_ckpt, dataset, training=True):
+def model_setup(args, img_size, num_classes, model_type, pretrained_ckpt, dataset, training=True):
     config = CONFIGS[model_type]
     model = VisionTransformer(config, img_size, zero_head=True, num_classes=num_classes)
     if pretrained_ckpt:
@@ -66,24 +68,35 @@ def get_model(args, img_size, num_classes, model_type, pretrained_ckpt, dataset,
             model.load_state_dict(torch.load(pretrained_ckpt, map_location=torch.device('cpu')))
     num_params = count_parameters(model)
 
+
+    if training:
+        args.name = args.dataset + '_img' + str(img_size) + '_cls' + str(num_classes)
+        args.img_size = img_size
+        args.dataset = dataset
+        dir_name = os.path.join(args.output_dir, args.name)
+        # dir_name = os.path.join(args.output_dir,args.name+datetime.now().strftime("%Y%m%d-%H%M%S"))
+        if not os.path.exists(dir_name):
+            os.mkdir(dir_name)
+        args.output_dir = dir_name
+
+    # Setup logging
+    logging.basicConfig(format='%(asctime)s - %(levelname)s - %(name)s - %(message)s',
+                        datefmt='%m/%d/%Y %H:%M:%S',
+                        level=logging.INFO if args.local_rank in [-1, 0] else logging.WARN,
+                        filename=f'{args.output_dir}/training.log',
+                        filemode='w')
+
     logger.info("{}".format(config))
     logger.info("Training parameters %s", args)
     logger.info("Total Parameter: \t%2.1fM" % num_params)
     print(num_params)
 
-    if training:
-        args.name = args.dataset+'_img'+str(img_size)+'_cls'+str(num_classes)+'_'
-        args.img_size=img_size
-        args.dataset=dataset
-        dir_name = os.path.join(args.output_dir,args.name+datetime.now().strftime("%Y%m%d-%H%M%S"))
-        os.mkdir(dir_name)
-        args.output_dir = dir_name
     return args, model
 
 
 def count_parameters(model):
     params = sum(p.numel() for p in model.parameters() if p.requires_grad)
-    return params/1000000
+    return params / 1000000
 
 
 def set_seed(args):
@@ -193,15 +206,15 @@ def train(args, model):
 
             if args.gradient_accumulation_steps > 1:
                 loss = loss / args.gradient_accumulation_steps
-            if 0: #args.fp16:
+            if args.fp16:
                 with amp.scale_loss(loss, optimizer) as scaled_loss:
                     scaled_loss.backward()
             else:
                 loss.backward()
 
             if (step + 1) % args.gradient_accumulation_steps == 0:
-                losses.update(loss.item()*args.gradient_accumulation_steps)
-                if 0: #args.fp16:
+                losses.update(loss.item() * args.gradient_accumulation_steps)
+                if args.fp16:
                     torch.nn.utils.clip_grad_norm_(amp.master_params(optimizer), args.max_grad_norm)
                 else:
                     torch.nn.utils.clip_grad_norm_(model.parameters(), args.max_grad_norm)
@@ -217,7 +230,7 @@ def train(args, model):
                     writer.add_scalar("train/loss", scalar_value=losses.val, global_step=global_step)
                     writer.add_scalar("train/lr", scalar_value=scheduler.get_lr()[0], global_step=global_step)
                 if global_step % args.eval_every == 0 and args.local_rank in [-1, 0]:
-                    save_model(args, model) #remove this
+                    save_model(args, model)  # remove this
                     accuracy = valid(args, model, writer, test_loader, global_step)
                     if best_acc < accuracy:
                         save_model(args, model)
@@ -237,7 +250,7 @@ def train(args, model):
 
 
 def main(args):
-    gin.parse_config_file(args.model_config)
+    gin.parse_config_file(args.model_config, skip_unknown=True)
 
     # Setup CUDA, GPU & distributed training
     if args.local_rank == -1:
@@ -251,18 +264,14 @@ def main(args):
         args.n_gpu = 1
     args.device = device
 
-    # Setup logging
-    logging.basicConfig(format='%(asctime)s - %(levelname)s - %(name)s - %(message)s',
-                        datefmt='%m/%d/%Y %H:%M:%S',
-                        level=logging.INFO if args.local_rank in [-1, 0] else logging.WARN)
-    logger.warning("Process rank: %s, device: %s, n_gpu: %s, distributed training: %s, 16-bits training: %s" %
-                   (args.local_rank, args.device, args.n_gpu, bool(args.local_rank != -1), args.fp16))
-
     # Set seed
     set_seed(args)
 
     # Model Setup
-    args, model = get_model(args)
+    args, model = model_setup(args)
+
+    logger.warning("Process rank: %s, device: %s, n_gpu: %s, distributed training: %s, 16-bits training: %s" %
+                   (args.local_rank, args.device, args.n_gpu, bool(args.local_rank != -1), args.fp16))
 
     # Training
     train(args, model)