@@ -29,11 +29,10 @@
 lr = 1e-3  # learning rate
 momentum = 0.9  # momentum
 workers = 4  # number of workers for loading data in the DataLoader
-epochs = 200  # number of epochs to run without early-stopping
+epochs = 2  # number of epochs to run without early-stopping
 grad_clip = None  # clip gradients at this value
 print_freq = 2000  # print training or validation status every __ batches
 checkpoint = None  # path to model checkpoint, None if none
-best_acc = 0.  # assume the accuracy is 0 at first
 
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
@@ -44,7 +43,7 @@ def main():
     """
     Training and validation.
     """
-    global best_acc, epochs_since_improvement, checkpoint, start_epoch, word_map
+    global checkpoint, start_epoch, word_map
 
     # Initialize model or load checkpoint
     if checkpoint is not None:
@@ -53,10 +52,8 @@ def main():
         optimizer = checkpoint['optimizer']
         word_map = checkpoint['word_map']
         start_epoch = checkpoint['epoch'] + 1
-        best_acc = checkpoint['best_acc']
-        epochs_since_improvement = checkpoint['epochs_since_improvement']
         print(
-            '\nLoaded checkpoint from epoch %d, with a previous best accuracy of %.3f.\n' % (start_epoch - 1, best_acc))
+            '\nLoaded checkpoint from epoch %d.\n' % (start_epoch - 1))
     else:
         embeddings, emb_size = load_word2vec_embeddings(word2vec_file, word_map)  # load pre-trained word2vec embeddings
 
@@ -85,8 +82,6 @@ def main():
     # DataLoaders
     train_loader = torch.utils.data.DataLoader(HANDataset(data_folder, 'train'), batch_size=batch_size, shuffle=True,
                                                num_workers=workers, pin_memory=True)
-    val_loader = torch.utils.data.DataLoader(HANDataset(data_folder, 'test'), batch_size=batch_size, shuffle=True,
-                                             num_workers=workers, pin_memory=True)
 
     # Epochs
     for epoch in range(start_epoch, epochs):
@@ -97,25 +92,11 @@ def main():
               optimizer=optimizer,
               epoch=epoch)
 
-        # One epoch's validation
-        acc = validate(val_loader=val_loader,
-                       model=model,
-                       criterion=criterion)
-
-        # Did validation accuracy improve?
-        is_best = acc > best_acc
-        best_acc = max(acc, best_acc)
-        if not is_best:
-            epochs_since_improvement += 1
-            print("\nEpochs since improvement: %d\n" % (epochs_since_improvement,))
-        else:
-            epochs_since_improvement = 0
-
         # Decay learning rate every epoch
-        # adjust_learning_rate(optimizer, 0.5)
+        adjust_learning_rate(optimizer, 0.1)
 
         # Save checkpoint
-        save_checkpoint(epoch, model, optimizer, best_acc, word_map, epochs_since_improvement, is_best)
+        save_checkpoint(epoch, model, optimizer, word_map)
 
 
 def train(train_loader, model, criterion, optimizer, epoch):
@@ -190,69 +171,5 @@ def train(train_loader, model, criterion, optimizer, epoch):
                                                               acc=accs))
 
 
-def validate(val_loader, model, criterion):
-    """
-    Performs one epoch's validation.
-
-    :param val_loader: DataLoader for validation data
-    :param model: model
-    :param criterion: cross entropy loss layer
-    :return: validation accuracy score
-    """
-    model.eval()
-
-    batch_time = AverageMeter()  # forward prop. + back prop. time per batch
-    data_time = AverageMeter()  # data loading time per batch
-    losses = AverageMeter()  # cross entropy loss
-    accs = AverageMeter()  # accuracies
-
-    start = time.time()
-
-    # Batches
-    for i, (documents, sentences_per_document, words_per_sentence, labels) in enumerate(val_loader):
-
-        data_time.update(time.time() - start)
-
-        documents = documents.to(device)  # (batch_size, sentence_limit, word_limit)
-        sentences_per_document = sentences_per_document.squeeze(1).to(device)  # (batch_size)
-        words_per_sentence = words_per_sentence.to(device)  # (batch_size, sentence_limit)
-        labels = labels.squeeze(1).to(device)  # (batch_size)
-
-        # Forward prop.
-        scores, word_alphas, sentence_alphas = model(documents, sentences_per_document,
-                                                     words_per_sentence)  # (n_documents, n_classes), (n_documents, max_doc_len_in_batch, max_sent_len_in_batch), (n_documents, max_doc_len_in_batch)
-
-        # Loss
-        loss = criterion(scores, labels)
-
-        # Find accuracy
-        _, predictions = scores.max(dim=1)  # (n_documents)
-        correct_predictions = torch.eq(predictions, labels).sum().item()
-        accuracy = correct_predictions / labels.size(0)
-
-        # Keep track of metrics
-        losses.update(loss.item(), labels.size(0))
-        batch_time.update(time.time() - start)
-        accs.update(accuracy, labels.size(0))
-
-        start = time.time()
-
-        # Print training status
-        if i % print_freq == 0:
-            print('[{0}/{1}]\t'
-                  'Batch Time {batch_time.val:.3f} ({batch_time.avg:.3f})\t'
-                  'Data Load Time {data_time.val:.3f} ({data_time.avg:.3f})\t'
-                  'Loss {loss.val:.4f} ({loss.avg:.4f})\t'
-                  'Accuracy {acc.val:.3f} ({acc.avg:.3f})'.format(i, len(val_loader),
-                                                                  batch_time=batch_time,
-                                                                  data_time=data_time, loss=losses,
-                                                                  acc=accs))
-
-    print('\n * LOSS - {loss.avg:.3f}, ACCURACY - {acc.avg:.3f}\n'.format(loss=losses,
-                                                                          acc=accs))
-
-    return accs.avg
-
-
 if __name__ == '__main__':
     main()
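
With the validation loop gone, the commented-out decay becomes an unconditional adjust_learning_rate(optimizer, 0.1) after every epoch, so the learning rate shrinks tenfold per epoch (1e-3 becomes 1e-4 after the first). The helper itself is outside this diff; a minimal sketch, assuming it simply scales each parameter group's learning rate in place, which is the standard PyTorch pattern:

def adjust_learning_rate(optimizer, scale_factor):
    """Multiply the learning rate of every parameter group by scale_factor.

    Sketch only: the real helper is not shown in this diff.
    """
    for param_group in optimizer.param_groups:
        param_group['lr'] = param_group['lr'] * scale_factor
    print("\nDecayed learning rate to %f.\n" % (optimizer.param_groups[0]['lr'],))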
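
The checkpointing call also shrinks from save_checkpoint(epoch, model, optimizer, best_acc, word_map, epochs_since_improvement, is_best) to save_checkpoint(epoch, model, optimizer, word_map), so the helper must have been simplified to match. A sketch of the reduced signature, where the state keys mirror the ones main() reads back ('epoch', 'optimizer', 'word_map', plus the model itself) and the output filename is an assumption, not shown in this diff:

import torch


def save_checkpoint(epoch, model, optimizer, word_map):
    """Save a checkpoint after every epoch; no best-model bookkeeping.

    Sketch only: keys match what main() loads from the checkpoint dict.
    """
    state = {'epoch': epoch,
             'model': model,
             'optimizer': optimizer,
             'word_map': word_map}
    torch.save(state, 'checkpoint.pth.tar')  # assumed filename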