diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..9342dd3 --- /dev/null +++ b/.gitignore @@ -0,0 +1,4 @@ +data/* +*.pth +*.npy +*.pyc diff --git a/code/main.py b/code/main.py new file mode 100644 index 0000000..06cda94 --- /dev/null +++ b/code/main.py @@ -0,0 +1,303 @@ +from __future__ import print_function +from __future__ import division + +import os +import pdb +import csv +import time +import random +import numpy as np +import matplotlib.pyplot as plt + +import torch +import torchvision +import torchvision.transforms as transforms + +from PIL import Image + +from torch.utils.data.dataset import Dataset +from torch.utils.data import DataLoader + +from torch import nn +from torch.autograd import Variable +from torch.optim import Adam + +from resnet import resnet50 # homemade resnet pre-trained models :) +from resnet import resnet34 # homemade resnet pre-trained models :) + +USE_GPU = True + +TRAIN_HEAD_DIRS = ['../data/frames/train/house/1/head/', '../data/frames/train/house/1/head/', + '../data/frames/train/house/2/head/', '../data/frames/train/house/2/head/', + '../data/frames/train/house/3/head/', '../data/frames/train/house/3/head/', + '../data/frames/train/lab/1/head/', '../data/frames/train/lab/1/head/', + '../data/frames/train/lab/2/head/', '../data/frames/train/lab/2/head/', + '../data/frames/train/lab/3/head/', '../data/frames/train/lab/3/head/', + '../data/frames/train/lab/4/head/', '../data/frames/train/lab/4/head/', + '../data/frames/train/office/1/head/', '../data/frames/train/office/1/head/', + '../data/frames/train/office/2/head/', '../data/frames/train/office/2/head/', + '../data/frames/train/office/3/head/', '../data/frames/train/office/3/head/',] + +TRAIN_HAND_DIRS = ['../data/frames/train/house/1/Lhand/', '../data/frames/train/house/1/Rhand/', + '../data/frames/train/house/2/Lhand/', '../data/frames/train/house/2/Rhand/', + '../data/frames/train/house/3/Lhand/', '../data/frames/train/house/3/Rhand/', + '../data/frames/train/lab/1/Lhand/', '../data/frames/train/lab/1/Rhand/', + '../data/frames/train/lab/2/Lhand/', '../data/frames/train/lab/2/Rhand/', + '../data/frames/train/lab/3/Lhand/', '../data/frames/train/lab/3/Rhand/', + '../data/frames/train/lab/4/Lhand/', '../data/frames/train/lab/4/Rhand/', + '../data/frames/train/office/1/Lhand/', '../data/frames/train/office/1/Rhand/', + '../data/frames/train/office/2/Lhand/', '../data/frames/train/office/2/Rhand/', + '../data/frames/train/office/3/Lhand/', '../data/frames/train/office/3/Rhand/',] + +TEST_HEAD_DIRS = ['../data/frames/test/house/1/head/', '../data/frames/test/house/1/head/', + '../data/frames/test/house/2/head/', '../data/frames/test/house/2/head/', + '../data/frames/test/house/3/head/', '../data/frames/test/house/3/head/', + '../data/frames/test/lab/1/head/', '../data/frames/test/lab/1/head/', + '../data/frames/test/lab/2/head/', '../data/frames/test/lab/2/head/', + '../data/frames/test/lab/3/head/', '../data/frames/test/lab/3/head/', + '../data/frames/test/lab/4/head/', '../data/frames/test/lab/4/head/', + '../data/frames/test/office/1/head/', '../data/frames/test/office/1/head/', + '../data/frames/test/office/2/head/', '../data/frames/test/office/2/head/', + '../data/frames/test/office/3/head/', '../data/frames/test/office/3/head/',] + +TEST_HAND_DIRS = ['../data/frames/test/house/1/Lhand/', '../data/frames/test/house/1/Rhand/', + '../data/frames/test/house/2/Lhand/', '../data/frames/test/house/2/Rhand/', + '../data/frames/test/house/3/Lhand/', '../data/frames/test/house/3/Rhand/', + 
'../data/frames/test/lab/1/Lhand/', '../data/frames/test/lab/1/Rhand/', + '../data/frames/test/lab/2/Lhand/', '../data/frames/test/lab/2/Rhand/', + '../data/frames/test/lab/3/Lhand/', '../data/frames/test/lab/3/Rhand/', + '../data/frames/test/lab/4/Lhand/', '../data/frames/test/lab/4/Rhand/', + '../data/frames/test/office/1/Lhand/', '../data/frames/test/office/1/Rhand/', + '../data/frames/test/office/2/Lhand/', '../data/frames/test/office/2/Rhand/', + '../data/frames/test/office/3/Lhand/', '../data/frames/test/office/3/Rhand/',] + +TRAIN_FA_LABELS = ['../data/labels/house/FA_left1.npy', '../data/labels/house/FA_right1.npy', + '../data/labels/house/FA_left2.npy', '../data/labels/house/FA_right2.npy', + '../data/labels/house/FA_left3.npy', '../data/labels/house/FA_right3.npy', + '../data/labels/lab/FA_left1.npy', '../data/labels/lab/FA_right1.npy', + '../data/labels/lab/FA_left2.npy', '../data/labels/lab/FA_right2.npy', + '../data/labels/lab/FA_left3.npy', '../data/labels/lab/FA_right3.npy', + '../data/labels/lab/FA_left4.npy', '../data/labels/lab/FA_right4.npy', + '../data/labels/office/FA_left1.npy', '../data/labels/office/FA_right1.npy', + '../data/labels/office/FA_left2.npy', '../data/labels/office/FA_right2.npy', + '../data/labels/office/FA_left3.npy', '../data/labels/office/FA_right3.npy',] + +TRAIN_OBJ_LABELS = ['../data/labels/house/obj_left1.npy', '../data/labels/house/obj_right1.npy', + '../data/labels/house/obj_left2.npy', '../data/labels/house/obj_right2.npy', + '../data/labels/house/obj_left3.npy', '../data/labels/house/obj_right3.npy', + '../data/labels/lab/obj_left1.npy', '../data/labels/lab/obj_right1.npy', + '../data/labels/lab/obj_left2.npy', '../data/labels/lab/obj_right2.npy', + '../data/labels/lab/obj_left3.npy', '../data/labels/lab/obj_right3.npy', + '../data/labels/lab/obj_left4.npy', '../data/labels/lab/obj_right4.npy', + '../data/labels/office/obj_left1.npy', '../data/labels/office/obj_right1.npy', + '../data/labels/office/obj_left2.npy', '../data/labels/office/obj_right2.npy', + '../data/labels/office/obj_left3.npy', '../data/labels/office/obj_right3.npy',] + +TEST_FA_LABELS = ['../data/labels/house/FA_left4.npy', '../data/labels/house/FA_right4.npy', + '../data/labels/house/FA_left5.npy', '../data/labels/house/FA_right5.npy', + '../data/labels/house/FA_left6.npy', '../data/labels/house/FA_right6.npy', + '../data/labels/lab/FA_left5.npy', '../data/labels/lab/FA_right5.npy', + '../data/labels/lab/FA_left6.npy', '../data/labels/lab/FA_right6.npy', + '../data/labels/lab/FA_left7.npy', '../data/labels/lab/FA_right7.npy', + '../data/labels/lab/FA_left8.npy', '../data/labels/lab/FA_right8.npy', + '../data/labels/office/FA_left4.npy', '../data/labels/office/FA_right4.npy', + '../data/labels/office/FA_left5.npy', '../data/labels/office/FA_right5.npy', + '../data/labels/office/FA_left6.npy', '../data/labels/office/FA_right6.npy',] + +TEST_OBJ_LABELS = ['../data/labels/house/obj_left4.npy', '../data/labels/house/obj_right4.npy', + '../data/labels/house/obj_left5.npy', '../data/labels/house/obj_right5.npy', + '../data/labels/house/obj_left6.npy', '../data/labels/house/obj_right6.npy', + '../data/labels/lab/obj_left5.npy', '../data/labels/lab/obj_right5.npy', + '../data/labels/lab/obj_left6.npy', '../data/labels/lab/obj_right6.npy', + '../data/labels/lab/obj_left7.npy', '../data/labels/lab/obj_right7.npy', + '../data/labels/lab/obj_left8.npy', '../data/labels/lab/obj_right8.npy', + '../data/labels/office/obj_left4.npy', '../data/labels/office/obj_right4.npy', + 
'../data/labels/office/obj_left5.npy', '../data/labels/office/obj_right5.npy', + '../data/labels/office/obj_left6.npy', '../data/labels/office/obj_right6.npy',] + +SCENES = ['house', 'lab', 'office'] + +EPOCH = 300 +BATCH_SIZE = 64 + +MSG_DISPLAY_FREQ = 20 + +LOSS = np.array([]) + +class HandcamDataset: + + def __init__(self, head_dirs, hand_dirs, fa_nps, obj_nps, transform=None): + # check the input params + assert len(head_dirs) == len(hand_dirs) == len(fa_nps) == len(obj_nps) + # retrieve all the filenames + self.data = [] + for (head_dir, hand_dir, fa_np, obj_np) in zip(head_dirs, hand_dirs, fa_nps, obj_nps): + fa_labels = np.load(fa_np) + obj_labels = np.load(obj_np) + head_filenames = os.listdir(head_dir) + head_filenames = sorted(head_filenames, + key=lambda pid: int(pid.split('Image')[1].split('.')[0])) + hand_filenames = os.listdir(hand_dir) + hand_filenames = sorted(hand_filenames, + key=lambda pid: int(pid.split('Image')[1].split('.')[0])) + for (head_filename, hand_filename, fa_label, obj_label) in zip(head_filenames, hand_filenames, fa_labels, obj_labels): + self.data.append({'head_filename':head_dir+head_filename, + 'hand_filename':hand_dir+hand_filename, + 'fa_label':fa_label, + 'obj_label':obj_label},) + # store transformation settings + self.transform = transform + + def __getitem__(self, index): + scene = SCENES.index(self.data[index]['head_filename'].split('/')[4]) + head_img = Image.open(self.data[index]['head_filename']) + head_img = head_img.convert('RGB') + head_img = head_img.resize((224, 224), resample=Image.LANCZOS) + hand_img = Image.open(self.data[index]['hand_filename']) + hand_img = hand_img.convert('RGB') + hand_img = hand_img.resize((224, 224), resample=Image.LANCZOS) + if self.transform is not None: + head_img = self.transform(head_img) + hand_img = self.transform(hand_img) + assert isinstance(head_img, torch.FloatTensor) # img must be torch.FloatTensor + assert isinstance(hand_img, torch.FloatTensor) # img must be torch.FloatTensor + fa_label = torch.LongTensor([long(self.data[index]['fa_label'])]) # label must be torch.LongTensor + obj_label = torch.LongTensor([long(self.data[index]['obj_label'])]) # label must be torch.LongTensor + return scene, head_img, hand_img, fa_label, obj_label + + def __len__(self): + return len(self.data) + + +class HanNet(nn.Module): + + def __init__(self, pretrained=False, num_classes=1000): + super(HanNet, self).__init__() + self.headstream = resnet34(pretrained=pretrained) + self.handstream = resnet34(pretrained=pretrained) + self.fc = nn.Linear(512 * 2, num_classes) + + def forward(self, x): + x = torch.cat((self.headstream(x[0]), self.handstream(x[1])), dim=1) + x = self.fc(x) + return x + + +def train(train_loader, model, criterion, optimizer, epoch): + + batch_time = 0.0 + + # switch to train mode + model.train() + + end = time.time() + + running_loss = 0.0 + global LOSS + + for i, (_, head_inputs, hand_inputs, fa_labels, obj_labels) in enumerate(train_loader): + + fa_labels = torch.squeeze(fa_labels, 1) + obj_labels = torch.squeeze(obj_labels, 1) + + if USE_GPU: + head_inputs = Variable(head_inputs).cuda(async=True) + hand_inputs = Variable(hand_inputs).cuda(async=True) + fa_labels = Variable(fa_labels).cuda(async=True) + obj_labels = Variable(obj_labels).cuda(async=True) + else: + head_inputs = Variable(head_inputs) + hand_inputs = Variable(hand_inputs) + fa_labels = Variable(fa_labels) + obj_labels = Variable(obj_labels) + + outputs = model([head_inputs, hand_inputs]) + + loss = criterion(outputs[:, 0:2], fa_labels) + 
criterion(outputs[:, 2:26], obj_labels) + + optimizer.zero_grad() + loss.backward() + optimizer.step() + + running_loss += loss.data[0] + + batch_time += time.time() - end + end = time.time() + + if i%MSG_DISPLAY_FREQ == (MSG_DISPLAY_FREQ-1): + print("Epoch: [{}][{}/{}]\t Loss: {:.8f}\t Time {:.3f}".format(epoch, i+1, len(train_loader), running_loss/MSG_DISPLAY_FREQ, batch_time/MSG_DISPLAY_FREQ)) + LOSS = np.append(LOSS, running_loss/MSG_DISPLAY_FREQ) + running_loss = 0.0 + batch_time = 0.0 + + np.save('loss_{:03}.npy'.format(epoch), LOSS) + + +def test(test_loader, model, epoch): + + # switch to evaluate mode + model.eval() + + confusion_matrix = np.zeros((3, 24, 24)) + + for i, (scenes, head_inputs, hand_inputs, _, obj_labels) in enumerate(test_loader): + + obj_labels = torch.squeeze(obj_labels, 1) + + if USE_GPU: + head_inputs = Variable(head_inputs, volatile=True).cuda(async=True) + hand_inputs = Variable(hand_inputs, volatile=True).cuda(async=True) + obj_labels = Variable(obj_labels, volatile=True).cuda(async=True) + else: + head_inputs = Variable(head_inputs, volatile=True) + hand_inputs = Variable(hand_inputs, volatile=True) + obj_labels = Variable(obj_labels, volatile=True) + + outputs = model([head_inputs, hand_inputs]) + + _, predictions = torch.max(outputs[:, 2:25], 1) + + for j in range(predictions.data.size(0)): + + scene = scenes[j] + prediction = predictions.data[j] + label = obj_labels.data[j] + + confusion_matrix[scene][prediction][label] += 1 + + print("Acc: {:.3}".format(np.sum(np.trace(confusion_matrix, axis1=1, axis2=2))/np.sum(confusion_matrix))) + np.save('cm_{:03}.npy'.format(epoch), confusion_matrix) + +def main(): + + transformations = transforms.Compose([ + transforms.ToTensor(), + transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]) + ]) + + train_dataset = HandcamDataset(TRAIN_HEAD_DIRS, TRAIN_HAND_DIRS, TRAIN_FA_LABELS, TRAIN_OBJ_LABELS, transformations) + train_loader = DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True, num_workers=2) + + test_dataset = HandcamDataset(TEST_HEAD_DIRS, TEST_HAND_DIRS, TRAIN_FA_LABELS, TRAIN_OBJ_LABELS, transformations) + test_loader = DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=True, num_workers=2) + + print("=> using pre-trained model HanNet") + model = HanNet(pretrained=True, num_classes=2+24) + + if USE_GPU: + model = model.cuda() + + if USE_GPU: + criterion = nn.CrossEntropyLoss().cuda() + else: + criterion = nn.CrossEntropyLoss() + + optimizer = torch.optim.Adam(model.parameters(), lr=1e-3) + + for epoch in range(EPOCH): + # train(train_loader, model, criterion, optimizer, epoch) + test(test_loader, model, epoch) + torch.save(model, 'model_{:03}.pth'.format(epoch)) + +if __name__ == '__main__': + main() diff --git a/code/resnet.py b/code/resnet.py new file mode 100644 index 0000000..39f9d5d --- /dev/null +++ b/code/resnet.py @@ -0,0 +1,235 @@ +import pdb +import torch.nn as nn +import math +import torch.utils.model_zoo as model_zoo + +from torch.nn.parameter import Parameter + +__all__ = ['ResNet', 'resnet18', 'resnet34', 'resnet50', 'resnet101', + 'resnet152'] + + +model_urls = { + 'resnet18': 'https://download.pytorch.org/models/resnet18-5c106cde.pth', + 'resnet34': 'https://download.pytorch.org/models/resnet34-333f7ec4.pth', + 'resnet50': 'https://download.pytorch.org/models/resnet50-19c8e357.pth', + 'resnet101': 'https://download.pytorch.org/models/resnet101-5d3b4d8f.pth', + 'resnet152': 'https://download.pytorch.org/models/resnet152-b121ed2d.pth', +} + + +def 
conv3x3(in_planes, out_planes, stride=1): + "3x3 convolution with padding" + return nn.Conv2d(in_planes, out_planes, kernel_size=3, stride=stride, + padding=1, bias=False) + + +class BasicBlock(nn.Module): + expansion = 1 + + def __init__(self, inplanes, planes, stride=1, downsample=None): + super(BasicBlock, self).__init__() + self.conv1 = conv3x3(inplanes, planes, stride) + self.bn1 = nn.BatchNorm2d(planes) + self.relu = nn.ReLU(inplace=True) + self.conv2 = conv3x3(planes, planes) + self.bn2 = nn.BatchNorm2d(planes) + self.downsample = downsample + self.stride = stride + + def forward(self, x): + residual = x + + out = self.conv1(x) + out = self.bn1(out) + out = self.relu(out) + + out = self.conv2(out) + out = self.bn2(out) + + if self.downsample is not None: + residual = self.downsample(x) + + out += residual + out = self.relu(out) + + return out + + +class Bottleneck(nn.Module): + expansion = 4 + + def __init__(self, inplanes, planes, stride=1, downsample=None): + super(Bottleneck, self).__init__() + self.conv1 = nn.Conv2d(inplanes, planes, kernel_size=1, bias=False) + self.bn1 = nn.BatchNorm2d(planes) + self.conv2 = nn.Conv2d(planes, planes, kernel_size=3, stride=stride, + padding=1, bias=False) + self.bn2 = nn.BatchNorm2d(planes) + self.conv3 = nn.Conv2d(planes, planes * 4, kernel_size=1, bias=False) + self.bn3 = nn.BatchNorm2d(planes * 4) + self.relu = nn.ReLU(inplace=True) + self.downsample = downsample + self.stride = stride + + def forward(self, x): + residual = x + + out = self.conv1(x) + out = self.bn1(out) + out = self.relu(out) + + out = self.conv2(out) + out = self.bn2(out) + out = self.relu(out) + + out = self.conv3(out) + out = self.bn3(out) + + if self.downsample is not None: + residual = self.downsample(x) + + out += residual + out = self.relu(out) + + return out + + +class ResNet(nn.Module): + + def __init__(self, block, layers, num_classes=1000): + self.inplanes = 64 + super(ResNet, self).__init__() + self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3, + bias=False) + self.bn1 = nn.BatchNorm2d(64) + self.relu = nn.ReLU(inplace=True) + self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1) + self.layer1 = self._make_layer(block, 64, layers[0]) + self.layer2 = self._make_layer(block, 128, layers[1], stride=2) + self.layer3 = self._make_layer(block, 256, layers[2], stride=2) + self.layer4 = self._make_layer(block, 512, layers[3], stride=2) + self.avgpool = nn.AvgPool2d(7) + self.fc = nn.Linear(512 * block.expansion, num_classes) + + for m in self.modules(): + if isinstance(m, nn.Conv2d): + n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels + m.weight.data.normal_(0, math.sqrt(2. 
/ n)) + elif isinstance(m, nn.BatchNorm2d): + m.weight.data.fill_(1) + m.bias.data.zero_() + + def _make_layer(self, block, planes, blocks, stride=1): + downsample = None + if stride != 1 or self.inplanes != planes * block.expansion: + downsample = nn.Sequential( + nn.Conv2d(self.inplanes, planes * block.expansion, + kernel_size=1, stride=stride, bias=False), + nn.BatchNorm2d(planes * block.expansion), + ) + + layers = [] + layers.append(block(self.inplanes, planes, stride, downsample)) + self.inplanes = planes * block.expansion + for i in range(1, blocks): + layers.append(block(self.inplanes, planes)) + + return nn.Sequential(*layers) + + def forward(self, x): + x = self.conv1(x) + x = self.bn1(x) + x = self.relu(x) + x = self.maxpool(x) + + x = self.layer1(x) + x = self.layer2(x) + x = self.layer3(x) + x = self.layer4(x) + + x = self.avgpool(x) + x = x.view(x.size(0), -1) + # x = self.fc(x) + + return x + + # homemade pre-trained model loading function :) + def load_pretrained_model(self, pretrained_state_dict): + + custom_state_dict = self.state_dict() + + for name, param in pretrained_state_dict.items(): + + if name not in custom_state_dict: + raise KeyError("unexpected key '{}' in state_dict".format(name)) + + if isinstance(param, Parameter): + param = param.data + + try: + custom_state_dict[name].copy_(param) + except: + print("skip loading key '{}' due to inconsistent size".format(name)) + + self.load_state_dict(custom_state_dict) + + +def resnet18(pretrained=False, **kwargs): + """Constructs a ResNet-18 model. + + Args: + pretrained (bool): If True, returns a model pre-trained on ImageNet + """ + model = ResNet(BasicBlock, [2, 2, 2, 2], **kwargs) + if pretrained: + model.load_pretrained_model(model_zoo.load_url(model_urls['resnet18'])) + return model + + +def resnet34(pretrained=False, **kwargs): + """Constructs a ResNet-34 model. + + Args: + pretrained (bool): If True, returns a model pre-trained on ImageNet + """ + model = ResNet(BasicBlock, [3, 4, 6, 3], **kwargs) + if pretrained: + model.load_pretrained_model(model_zoo.load_url(model_urls['resnet34'])) + return model + + +def resnet50(pretrained=False, **kwargs): + """Constructs a ResNet-50 model. + + Args: + pretrained (bool): If True, returns a model pre-trained on ImageNet + """ + model = ResNet(Bottleneck, [3, 4, 6, 3], **kwargs) + if pretrained: + model.load_pretrained_model(model_zoo.load_url(model_urls['resnet50'])) + return model + + +def resnet101(pretrained=False, **kwargs): + """Constructs a ResNet-101 model. + + Args: + pretrained (bool): If True, returns a model pre-trained on ImageNet + """ + model = ResNet(Bottleneck, [3, 4, 23, 3], **kwargs) + if pretrained: + model.load_pretrained_model(model_zoo.load_url(model_urls['resnet101'])) + return model + + +def resnet152(pretrained=False, **kwargs): + """Constructs a ResNet-152 model. + + Args: + pretrained (bool): If True, returns a model pre-trained on ImageNet + """ + model = ResNet(Bottleneck, [3, 8, 36, 3], **kwargs) + if pretrained: + model.load_pretrained_model(model_zoo.load_url(model_urls['resnet152'])) + return model diff --git a/results/all_cnf.png b/results/all_cnf.png new file mode 100644 index 0000000..92c06c9 Binary files /dev/null and b/results/all_cnf.png differ diff --git a/results/architecture.svg b/results/architecture.svg new file mode 100644 index 0000000..3223a20 --- /dev/null +++ b/results/architecture.svg @@ -0,0 +1,29 @@ + + + + background + + + + + + + Layer 1 + + ResNet50 + + FA + + OBJ + fc + fc + + + frame + + + free/active + + obj cat. 
+ + \ No newline at end of file diff --git a/results/house_cnf.png b/results/house_cnf.png new file mode 100644 index 0000000..65d4652 Binary files /dev/null and b/results/house_cnf.png differ diff --git a/results/index.md index 96ce61c..7eed2a2 100644 --- a/results/index.md +++ b/results/index.md @@ -1,47 +1,58 @@ -# Your Name (id) +# 趙浚宏 (106061611) -#Project 5: Deep Classification +# Project 5: Deep Classification ## Overview -The project is related to -> quote +The project is related to [Recognition from Hand Cameras: +A Revisit with Deep Learning](https://drive.google.com/file/d/0BwCy2boZhfdBM0ZDTV9lZW1rZzg/view). +> We revisit the study of a wrist-mounted camera system (re- +ferred to as HandCam) for recognizing activities of hands. HandCam has two unique properties as compared to egocentric systems [1, 2] (referred +to as HeadCam): (1) it avoids the need to detect hands; (2) it more +consistently observes the activities of hands. By taking advantage of +these properties, we propose a deep-learning-based method to recognize +hand states (free vs. active hands, hand gestures, object categories), and +discover object categories. ## Implementation -1. One - * item - * item -2. Two -``` -Code highlights -``` +* **Network Architecture** + + + ![](architecture.svg) + + +* **Multitask Loss** + + ``` + Loss = \lambda_1 * CrossEntropy(FA_OUTPUT, FA_LABEL) + \lambda_2 * CrossEntropy(OBJ_OUTPUT, OBJ_LABEL) + ``` + +* **Trained 30 epochs** + +* **Adam Optimizer lr=1e-3** ## Installation -* Other required packages. -* How to compile from source? - -### Results
+* numpy 1.13.3 +* pytorch 0.2.0 + +## Results + +* House Scene + + ![](house_cnf.png) + +* Lab Scene + + ![](lab_cnf.png) + +* Office Scene + + ![](office_cnf.png) + + +* All + + ![](all_cnf.png) diff --git a/results/lab_cnf.png b/results/lab_cnf.png new file mode 100644 index 0000000..62779d7 Binary files /dev/null and b/results/lab_cnf.png differ diff --git a/results/office_cnf.png b/results/office_cnf.png new file mode 100644 index 0000000..23fbfdd Binary files /dev/null and b/results/office_cnf.png differ
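For reference, the "Multitask Loss" bullet in the README corresponds directly to the slicing used in `train()` in `code/main.py`: the first two logits feed the free-vs-active (FA) cross-entropy term and the remaining 24 feed the object-category term, with no explicit weights, i.e. lambda_1 = lambda_2 = 1. The snippet below is a minimal, self-contained sketch of that loss using dummy tensors; it assumes a recent PyTorch API (plain tensors rather than the `Variable` wrapper the repository uses, since the code targets pytorch 0.2.0):

```python
import torch
import torch.nn as nn

# Dummy logits for a batch of 4 frames: 2 FA classes + 24 object classes,
# matching the slices outputs[:, 0:2] and outputs[:, 2:26] used in train().
outputs = torch.randn(4, 2 + 24, requires_grad=True)
fa_labels = torch.randint(0, 2, (4,))    # free (0) vs. active (1) hand state
obj_labels = torch.randint(0, 24, (4,))  # object category index

criterion = nn.CrossEntropyLoss()
lambda_1, lambda_2 = 1.0, 1.0            # main.py weights both terms equally

loss = lambda_1 * criterion(outputs[:, 0:2], fa_labels) + \
       lambda_2 * criterion(outputs[:, 2:26], obj_labels)
loss.backward()  # both terms contribute gradients to the shared output tensor
```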
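The confusion-matrix figures in the Results section are rendered from the `cm_XXX.npy` arrays that `test()` saves each epoch: shape `(3, 24, 24)`, indexed as `[scene][prediction][label]`, with overall accuracy printed as the sum of the per-scene traces divided by the total count. Below is one possible way to reduce such an array to per-scene and overall accuracies; `cm_000.npy` is just the epoch-0 file name produced by the `cm_{:03}.npy` pattern, and a reasonably recent NumPy is assumed:

```python
import numpy as np

SCENES = ['house', 'lab', 'office']  # same ordering as in main.py

# One (3, 24, 24) array per epoch, indexed as [scene][prediction][label].
cm = np.load('cm_000.npy')

for s, name in enumerate(SCENES):
    scene_cm = cm[s]
    acc = np.trace(scene_cm) / scene_cm.sum()  # correct / total for this scene
    print('{:<8s} accuracy: {:.3f}'.format(name, acc))

# Same quantity that test() prints: sum of traces over the grand total.
overall = np.trace(cm, axis1=1, axis2=2).sum() / cm.sum()
print('overall accuracy: {:.3f}'.format(overall))
```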