"""
-------------------------------------------------
   File Name:   triplet.py
   Author:      Zhonghao Huang
   Date:        2019/9/10
   Description: Triplet loss with batch-hard example mining.
-------------------------------------------------
"""

import torch
import torch.nn as nn


def topk_mask(input, dim, K=10, **kwargs):
    """Return a 0/1 mask marking the top-K entries of `input` along `dim`."""
    index = input.topk(max(1, min(K, input.size(dim))), dim=dim, **kwargs)[1]
    return torch.zeros_like(input).scatter(dim, index, 1.0)


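# Usage sketch (illustrative, not part of the original file): each row of the
# returned mask contains exactly K ones at the positions of its top-K scores.
def _demo_topk_mask():
    scores = torch.randn(3, 6)
    mask = topk_mask(scores, dim=1, K=2)
    print(mask)

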
def pdist(A, squared=False, eps=1e-4):
    """Pairwise (squared) Euclidean distances between the rows of `A`."""
    prod = torch.mm(A, A.t())
    norm = prod.diag().unsqueeze(1).expand_as(prod)
    res = (norm + norm.t() - 2 * prod).clamp(min=0)
    return res if squared else res.clamp(min=eps).sqrt()


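# Usage sketch (illustrative, not part of the original file): the result is a
# symmetric [N, N] matrix; its diagonal is ~sqrt(eps) rather than exactly 0
# because of the numerical-stability clamp.
def _demo_pdist():
    A = torch.randn(5, 8)
    D = pdist(A)
    print(D.shape, torch.allclose(D, D.t()))

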
def normalize(x, axis=-1):
    """Normalize to unit length along the specified dimension.
    Args:
        x: pytorch Tensor
    Returns:
        x: pytorch Tensor, same shape as input
    """
    x = 1. * x / (torch.norm(x, 2, axis, keepdim=True).expand_as(x) + 1e-12)
    return x


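# Usage sketch (illustrative, not part of the original file): after the call,
# every row has (approximately) unit L2 norm.
def _demo_normalize():
    x = torch.randn(4, 16)
    x_n = normalize(x, axis=-1)
    print(x_n.norm(p=2, dim=-1))

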
def euclidean_dist(x, y):
    """
    Args:
        x: pytorch Tensor, with shape [m, d]
        y: pytorch Tensor, with shape [n, d]
    Returns:
        dist: pytorch Tensor, with shape [m, n]
    """
    m, n = x.size(0), y.size(0)
    xx = torch.pow(x, 2).sum(1, keepdim=True).expand(m, n)
    yy = torch.pow(y, 2).sum(1, keepdim=True).expand(n, m).t()
    dist = xx + yy
    dist.addmm_(x, y.t(), beta=1, alpha=-2)
    dist = dist.clamp(min=1e-12).sqrt()  # for numerical stability
    return dist


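# Usage sketch (illustrative, not part of the original file): cross-checks
# `euclidean_dist` against torch.cdist on random data; the clamp(min=1e-12)
# only matters for near-zero distances, so a loose tolerance is used.
def _demo_euclidean_dist():
    x, y = torch.randn(4, 8), torch.randn(6, 8)
    print(torch.allclose(euclidean_dist(x, y), torch.cdist(x, y), atol=1e-4))

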
def hard_example_mining(dist_mat, labels, margin, return_inds=False):
    """For each anchor, find the hardest positive and negative sample.
    Args:
        dist_mat: pytorch Tensor, pairwise distance between samples, shape [N, N]
        labels: pytorch LongTensor, with shape [N]
        margin: unused by the mining itself; kept for interface compatibility
        return_inds: whether to also return the mined indices. Slightly cheaper if `False`.
    Returns:
        dist_ap: pytorch Tensor, distance(anchor, positive); shape [N]
        dist_an: pytorch Tensor, distance(anchor, negative); shape [N]
        p_inds: pytorch LongTensor, with shape [N];
            indices of selected hard positive samples; 0 <= p_inds[i] <= N - 1
        n_inds: pytorch LongTensor, with shape [N];
            indices of selected hard negative samples; 0 <= n_inds[i] <= N - 1
    NOTE: Only the case in which all labels have the same number of samples is
        considered, so all anchors can be processed in parallel.
    """
    assert len(dist_mat.size()) == 2
    assert dist_mat.size(0) == dist_mat.size(1)
    N = dist_mat.size(0)

    # shape [N, N]
    is_pos = labels.expand(N, N).eq(labels.expand(N, N).t())
    is_neg = labels.expand(N, N).ne(labels.expand(N, N).t())
    # `dist_ap` means distance(anchor, positive)
    # both `dist_ap` and `relative_p_inds` with shape [N, 1]
    dist_ap, relative_p_inds = torch.max(
        dist_mat[is_pos].contiguous().view(N, -1), 1, keepdim=True)
    # `dist_an` means distance(anchor, negative)
    # both `dist_an` and `relative_n_inds` with shape [N, 1]
    dist_an, relative_n_inds = torch.min(
        dist_mat[is_neg].contiguous().view(N, -1), 1, keepdim=True)
    # shape [N]
    dist_ap = dist_ap.squeeze(1)
    dist_an = dist_an.squeeze(1)

    if return_inds:
        # shape [N, N]
        ind = (labels.new().resize_as_(labels)
               .copy_(torch.arange(0, N).long())
               .unsqueeze(0).expand(N, N))
        # shape [N, 1]
        p_inds = torch.gather(
            ind[is_pos].contiguous().view(N, -1), 1, relative_p_inds.data)
        n_inds = torch.gather(
            ind[is_neg].contiguous().view(N, -1), 1, relative_n_inds.data)
        # shape [N]
        p_inds = p_inds.squeeze(1)
        n_inds = n_inds.squeeze(1)
        return dist_ap, dist_an, p_inds, n_inds

    return dist_ap, dist_an


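# Usage sketch (illustrative, not part of the original file): a toy batch with
# two identities and two samples each; every output has shape [N] = [4].
def _demo_hard_example_mining():
    feats = torch.randn(4, 16)
    labels = torch.tensor([0, 0, 1, 1])
    dist_mat = euclidean_dist(feats, feats)
    dist_ap, dist_an, p_inds, n_inds = hard_example_mining(
        dist_mat, labels, margin=0.3, return_inds=True)
    print(dist_ap, dist_an, p_inds, n_inds)

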
class TripletLoss(object):
    """Modified from Tong Xiao's open-reid (https://github.com/Cysu/open-reid).
    Related Triplet Loss theory can be found in the paper 'In Defense of the
    Triplet Loss for Person Re-Identification'."""

    def __init__(self, margin=None):
        self.margin = margin
        if margin is not None:
            self.ranking_loss = nn.MarginRankingLoss(margin=margin)
        else:
            self.ranking_loss = nn.SoftMarginLoss()

    def __call__(self, global_feat, labels, normalize_feature=False):
        if normalize_feature:
            global_feat = normalize(global_feat, axis=-1)
        dist_mat = euclidean_dist(global_feat, global_feat)
        dist_ap, dist_an = hard_example_mining(dist_mat, labels, self.margin)
        # target y = 1 means dist_an should be ranked larger than dist_ap
        y = dist_an.new().resize_as_(dist_an).fill_(1)
        if self.margin is not None:
            loss = self.ranking_loss(dist_an, dist_ap, y)
        else:
            loss = self.ranking_loss(dist_an - dist_ap, y)
        return loss, dist_ap, dist_an
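

# Usage sketch (illustrative, not part of the original file): how the loss might
# be called on a batch of embeddings; the feature dimension, batch layout, and
# margin value below are assumptions, not values from the original repo.
if __name__ == "__main__":
    criterion = TripletLoss(margin=0.3)
    feats = torch.randn(8, 128)                      # e.g. 4 identities x 2 images
    labels = torch.tensor([0, 0, 1, 1, 2, 2, 3, 3])
    loss, dist_ap, dist_an = criterion(feats, labels, normalize_feature=True)
    print(loss.item(), dist_ap.mean().item(), dist_an.mean().item())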