Added python implementation

laggui · laggui · commit 661147eb5b0a · 2018-11-09T13:52:06.000-05:00
diff --git a/pytorch/predict.py b/pytorch/predict.py
@@ -0,0 +1,82 @@
+import torch
+import torch.nn as nn
+import torch.backends.cudnn as cudnn
+
+import torchvision.transforms as transforms
+
+from torch import jit
+from PIL import Image
+
+import io
+import time
+import argparse
+import cv2
+
+from vgg import VGGNet
+
+# Run on the GPU when CUDA is available, otherwise fall back to the CPU
+device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
+# CIFAR-10 class names, indexed by the predicted class index
+classes = (
+    'plane', 'car', 'bird', 'cat', 'deer',
+    'dog', 'frog', 'horse', 'ship', 'truck',
+)
+
+def predict(model, image):
+    """Classify a single image and print the predicted CIFAR-10 class.
+
+    Args:
+        model: Callable network. It is called once with a normalized float
+            tensor of shape (1, C, H, W) placed on the module-level ``device``.
+        image: H x W x 3 numpy array in BGR channel order, as returned by
+            ``cv2.imread`` (assumed to hold 8-bit values, since it is scaled
+            by 1/255 before normalization).
+
+    Returns:
+        Tuple ``(label, score)``: the predicted class name and the largest
+        raw model output (not a probability).
+
+    Raises:
+        ValueError: If ``image`` is None, which is how ``cv2.imread`` reports
+            a file it could not read.
+    """
+    if image is None:
+        raise ValueError('Input image is None (could not be read)')
+
+    # convert BGR -> RGB by re-ordering the channel axis
+    x = image[:, :, (2, 1, 0)]
+    # H x W x C -> C x H x W for conv input
+    x = torch.from_numpy(x).permute(2, 0, 1)
+    # only affects how tensors are printed when debugging
+    torch.set_printoptions(threshold=5000)
+
+    normalize = transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010))
+    # scale to [0, 1] before applying the per-channel mean/std
+    img_tensor = normalize(x.float().div_(255))
+    # add a dimension for the batch; Tensor.to() returns the moved tensor
+    # instead of moving in place, so the result has to be rebound
+    img_tensor = img_tensor.unsqueeze(0).to(device)
+
+    with torch.no_grad():
+        # forward pass
+        outputs = model(img_tensor)
+    score, predicted = outputs.max(1)
+    label = classes[predicted.item()]
+    print('Predicted: {} | {}'.format(label, score.item()))
+    return label, score.item()
+
+
+
+if __name__ == '__main__':
+    # Command-line entry point: load a VGGNet (eager PyTorch weights or a
+    # serialized Torch Script module) and classify one image.
+    parser = argparse.ArgumentParser(description='VGGNet Predict Tool')
+    parser.add_argument('mtype', type=str, choices=['pytorch', 'torch-script'], help='Model type')
+    parser.add_argument('--model', type=str, default='../data/VGG16model.pth', help='Pre-trained model')
+    parser.add_argument('--image', type=str, default='../data/dog.png', help='Input image')
+    args = parser.parse_args()
+
+    # Model
+    print('==> Building model...')
+    if args.mtype == 'pytorch':
+        model = VGGNet('D-DSM', num_classes=10, input_size=32) # depthwise separable
+        # Load model
+        print('==> Loading PyTorch model...')
+        # map_location lets a checkpoint saved from GPU tensors load on a
+        # CPU-only host
+        state_dict = torch.load(args.model, map_location=device)
+        # a state dict saved from a DataParallel wrapper has every key
+        # prefixed with 'module.'; strip it so the bare model accepts it
+        if all(key.startswith('module.') for key in state_dict):
+            state_dict = {key[len('module.'):]: value for key, value in state_dict.items()}
+        model.load_state_dict(state_dict)
+        model.eval()
+        model.to(device)
+    else:
+        print('==> Loading Torch Script model...')
+        # Load ScriptModule from io.BytesIO object
+        with open(args.model, 'rb') as f:
+            buffer = io.BytesIO(f.read())
+        model = torch.jit.load(buffer)
+        print('[WARNING] ScriptModules cannot be moved to a GPU device yet. Running strictly on CPU for now.')
+        device = torch.device('cpu') # 'to' is not supported on TracedModules (yet)
+
+    if device.type == 'cuda':
+        cudnn.benchmark = True
+        model = torch.nn.DataParallel(model)
+
+    # the reported time covers image decoding as well as the forward pass
+    t0 = time.time()
+    image = cv2.imread(args.image)
+    if image is None:
+        # cv2.imread reports an unreadable or missing file by returning None
+        raise FileNotFoundError('Could not read image: {}'.format(args.image))
+    predict(model, image)
+    print('Time: {} seconds'.format(time.time()-t0))
diff --git a/pytorch/test.py b/pytorch/test.py
@@ -0,0 +1,81 @@
+import torch
+import torch.nn as nn
+import torch.backends.cudnn as cudnn
+
+import torchvision.datasets as datasets
+import torchvision.transforms as transforms
+
+from torch.utils.data import DataLoader
+from torch import jit
+
+import io
+import time
+import argparse
+
+from vgg import VGGNet
+
+# Pick the compute device: CUDA when available, CPU otherwise
+device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
+# NOTE: forcing device = torch.device('cpu') is the fallback for TracedModules,
+# which do not support 'to', ref: https://github.com/pytorch/pytorch/issues/6008
+
+def test(model, test_loader):
+    """Run ``model`` over ``test_loader`` and count correct top-1 predictions.
+
+    The model's train/eval mode is not changed here, so the caller decides
+    it. Running accuracy is printed on every 10th batch.
+
+    Args:
+        model: Callable network applied to each batch of inputs.
+        test_loader: Iterable yielding ``(inputs, targets)`` batches.
+
+    Returns:
+        Tuple ``(correct, total)``: correctly classified samples and the
+        number of samples seen.
+    """
+    report_every = 10
+    n_correct, n_seen = 0, 0
+
+    # inference only, so gradient tracking is switched off
+    with torch.no_grad():
+        for step, (images, labels) in enumerate(test_loader):
+            images = images.to(device)
+            labels = labels.to(device)
+
+            logits = model(images)
+
+            # the index of the largest output per sample is the predicted class
+            predictions = logits.max(1)[1]
+            n_seen += labels.size(0)
+            n_correct += predictions.eq(labels).sum().item()
+
+            if step % report_every != 0:
+                continue
+            print('Batch: %d, Acc: %.3f%% (%d/%d)' % (step+1, 100.*n_correct/n_seen, n_correct, n_seen))
+    return n_correct, n_seen
+
+if __name__ == '__main__':
+    # Command-line entry point: measure the accuracy of a VGGNet (eager
+    # PyTorch weights or a serialized Torch Script module) on the CIFAR-10
+    # test split.
+    parser = argparse.ArgumentParser(description='VGGNet Test Tool')
+    parser.add_argument('mtype', type=str, choices=['pytorch', 'torch-script'], help='Model type')
+    parser.add_argument('--model', type=str, default=None, help='Model file (default depends on the model type)')
+    args = parser.parse_args()
+
+    # Model
+    print('==> Building model...')
+    if args.mtype == 'pytorch':
+        model = VGGNet('D-DSM', num_classes=10, input_size=32) # depthwise separable
+        # Load model
+        print('==> Loading PyTorch model...')
+        # map_location lets a checkpoint saved from GPU tensors load on a
+        # CPU-only host
+        state_dict = torch.load(args.model or 'VGG16model.pth', map_location=device)
+        # a state dict saved from a DataParallel wrapper has every key
+        # prefixed with 'module.'; strip it so the bare model accepts it
+        if all(key.startswith('module.') for key in state_dict):
+            state_dict = {key[len('module.'):]: value for key, value in state_dict.items()}
+        model.load_state_dict(state_dict)
+        # a freshly built module starts in training mode; switch to eval so
+        # the accuracy is measured with inference behaviour
+        model.eval()
+        model.to(device)
+    else:
+        print('==> Loading Torch Script model...')
+        # Load ScriptModule from io.BytesIO object
+        with open(args.model or 'VGG16-traced-eval.pt', 'rb') as f:
+            buffer = io.BytesIO(f.read())
+        model = torch.jit.load(buffer)
+        print('[WARNING] ScriptModules cannot be moved to a GPU device yet. Running strictly on CPU for now.')
+        device = torch.device('cpu') # 'to' is not supported on TracedModules (yet)
+
+    # same per-channel normalization constants as the training script
+    transform_test = transforms.Compose([
+        transforms.ToTensor(),
+        transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
+    ])
+
+    testset = datasets.CIFAR10(root='./data', train=False, download=True, transform=transform_test)
+    test_loader = DataLoader(testset, batch_size=100, shuffle=False, num_workers=2)
+
+    if device.type == 'cuda':
+        cudnn.benchmark = True
+        model = torch.nn.DataParallel(model)
+
+    t0 = time.time()
+    correct, total = test(model, test_loader)
+    t1 = time.time()
+    print('Accuracy of the network on test dataset: %f (%d/%d)' % (100.*correct/total, correct, total))
+    print('Elapsed time: {} seconds'.format(t1-t0))
diff --git a/pytorch/to_torch_script.py b/pytorch/to_torch_script.py
@@ -0,0 +1,46 @@
+import torch
+import argparse
+
+from torch.jit import trace
+
+from vgg import VGGNet
+
+# Report the available device; tracing itself is done on the CPU because the
+# model is never moved
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+print('[Device] {}'.format(device))
+
+if __name__ == '__main__':
+    # Command-line entry point: trace a VGGNet into a Torch Script module,
+    # either untrained in training mode or pre-trained in eval mode.
+    parser = argparse.ArgumentParser(description='PyTorch Model to Torch Script')
+    parser.add_argument('mode', type=str, choices=['train', 'eval'], help='Model mode')
+    args = parser.parse_args()
+    for_eval = args.mode == 'eval'
+
+    example_input = torch.rand(1, 3, 32, 32)
+    # TracedModule objects do not inherit the .to() or .eval() methods, so
+    # the mode has to be fixed on the eager model before tracing
+
+    print('==> Building model...')
+    model = VGGNet('D-DSM', num_classes=10, input_size=32)
+    if for_eval:
+        # load "normal" pytorch trained model
+        print('==> Loading pre-trained model...')
+        state_dict = torch.load('VGG16model.pth', map_location=torch.device('cpu'))
+        # a state dict saved from a DataParallel wrapper has every key
+        # prefixed with 'module.'; strip it so the bare model accepts it
+        if all(key.startswith('module.') for key in state_dict):
+            state_dict = {key[len('module.'):]: value for key, value in state_dict.items()}
+        model.load_state_dict(state_dict)
+        model.eval()
+    else:
+        model.train()
+
+    # convert to Torch Script
+    print('==> Tracing model...')
+    traced_model = trace(model, example_input)
+
+    # the output file name records the mode the model was traced in
+    traced_model.save('VGG16-traced-eval.pt' if for_eval else 'VGG16-traced-train.pt')
diff --git a/pytorch/train.py b/pytorch/train.py
@@ -0,0 +1,134 @@
+import torch
+import torch.nn as nn
+import torchvision.datasets as datasets
+import torchvision.transforms as transforms
+import torch.backends.cudnn as cudnn
+import numpy as np
+import argparse
+import time
+import io
+
+from torch.utils.data.sampler import SubsetRandomSampler
+from torch.utils.data import Dataset, DataLoader
+from torch.optim.lr_scheduler import ReduceLROnPlateau, StepLR
+
+from torch import jit
+
+from vgg import VGGNet
+
+# Train on the GPU when CUDA is available, otherwise on the CPU
+# (set device = torch.device('cpu') to force CPU)
+device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
+
+def train(model, train_loader, criterion, optimizer, epoch):
+    """Train ``model`` for one pass over ``train_loader``.
+
+    Puts the model in training mode, performs one optimizer step per batch
+    and prints the running mean loss and accuracy on every 10th batch.
+
+    Args:
+        model: Network to optimize.
+        train_loader: Iterable yielding ``(inputs, targets)`` batches.
+        criterion: Loss callable taking ``(outputs, targets)``.
+        optimizer: Optimizer holding the model's parameters.
+        epoch: Epoch number, used only in the printed header.
+    """
+    model.train()
+    report_every = 10
+    running_loss = 0
+    n_correct = 0
+    n_seen = 0
+    print('\nEpoch: %d' % epoch)
+
+    for step, (images, labels) in enumerate(train_loader):
+        images = images.to(device)
+        labels = labels.to(device)
+
+        # clear gradients left over from the previous step
+        optimizer.zero_grad()
+
+        # forward pass and loss
+        logits = model(images)
+        loss = criterion(logits, labels)
+
+        # backward pass and parameter update
+        loss.backward()
+        optimizer.step()
+
+        # running statistics for the progress line
+        running_loss += loss.item()
+        predictions = logits.max(1)[1]
+        n_seen += labels.size(0)
+        n_correct += predictions.eq(labels).sum().item()
+
+        if step % report_every != 0:
+            continue
+        batches_done = step + 1
+        print('Batch: %d, Loss: %.3f | Acc: %.3f%% (%d/%d)' % (batches_done, running_loss/batches_done, 100.*n_correct/n_seen, n_correct, n_seen))
+
+def validate(model, val_loader, criterion):
+    """Compute the loss of ``model`` over ``val_loader`` without gradients.
+
+    Puts the model in eval mode and prints the running mean loss on every
+    10th batch.
+
+    Args:
+        model: Network to evaluate.
+        val_loader: Iterable yielding ``(inputs, targets)`` batches.
+        criterion: Loss callable taking ``(outputs, targets)``.
+
+    Returns:
+        Sum of the per-batch loss values (not the mean).
+    """
+    model.eval()
+    report_every = 10
+    total_loss = 0.0
+
+    # evaluation only, so gradient tracking is switched off
+    with torch.no_grad():
+        for step, (images, labels) in enumerate(val_loader):
+            images = images.to(device)
+            labels = labels.to(device)
+
+            batch_loss = criterion(model(images), labels)
+            total_loss += batch_loss.item()
+
+            if step % report_every != 0:
+                continue
+            print('Validation on Batch: %d, Loss: %f' % (step+1, total_loss/(step+1)))
+    return total_loss
+
+if __name__ == '__main__':
+    # Command-line entry point: train VGGNet (configuration 'D-DSM') on the
+    # CIFAR-10 training split and save the weights to 'VGG16model.pth'.
+    parser = argparse.ArgumentParser(description='VGGNet Training Tool')
+    parser.add_argument('mtype', type=str, choices=['pytorch', 'torch-script'], help='Model type')
+    args = parser.parse_args()
+    if args.mtype == 'torch-script':
+        # reject the unsupported mode before the dataset is downloaded
+        raise RuntimeError('Training is not supported on ScriptModules yet.') #https://github.com/pytorch/pytorch/issues/6008
+
+    # Load CIFAR10 dataset
+    print('==> Preparing data...')
+    transform_train = transforms.Compose([
+        transforms.RandomCrop(32, padding=4),
+        transforms.RandomHorizontalFlip(),
+        transforms.ToTensor(),
+        transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
+    ])
+
+    trainset = datasets.CIFAR10(root='./data', train=True, download=True, transform=transform_train)
+    train_loader = DataLoader(trainset, batch_size=128, shuffle=True, num_workers=4)
+
+    # Model
+    print('==> Building model...')
+    # 'D' would be plain VGG16 (configuration D in the paper); 'D-DSM' is the
+    # depthwise separable variant
+    model = VGGNet('D-DSM', num_classes=10, input_size=32) # depthwise separable
+    model = model.to(device)
+
+    if device.type == 'cuda':
+        cudnn.benchmark = True
+        model = torch.nn.DataParallel(model)
+
+    # Training
+    num_epochs = 200 # as opposed to the paper (74) because of CIFAR10 dataset
+    lr = 0.1
+    # define loss function (criterion) and optimizer
+    criterion = nn.CrossEntropyLoss()
+    optimizer = torch.optim.SGD(model.parameters(), lr, momentum=0.9, weight_decay=5e-4)
+
+    print('==> Training...')
+    train_time = 0
+    # a ReduceLROnPlateau(optimizer, 'min') scheduler would need a validation
+    # loss for scheduler.step(val_loss); no validation loader is built here
+    scheduler = StepLR(optimizer, step_size=100, gamma=0.1) # adjust lr by factor of 10 every 100 epochs
+    for epoch in range(num_epochs):
+        t0 = time.time()
+        # train one epoch
+        train(model, train_loader, criterion, optimizer, epoch)
+        t1 = time.time() - t0
+        print('{} seconds'.format(t1))
+        train_time += t1
+
+        # adjust learning rate with scheduler
+        scheduler.step()
+
+    print('==> Finished Training: {} seconds'.format(train_time))
+    # Save trained model
+    # DataParallel prefixes every state-dict key with 'module.'; save the
+    # wrapped network's own weights so a bare VGGNet can load the file
+    trained = model.module if isinstance(model, torch.nn.DataParallel) else model
+    torch.save(trained.state_dict(), 'VGG16model.pth')
diff --git a/pytorch/vgg.py b/pytorch/vgg.py