
Commit 676ea1e

Reproducible code for MGTN

22 files changed: +1569 -0 lines changed

README.md (+62)
# Modular Graph Transformer Networks (MGTN)
This project implements multi-label learning based on Modular Graph Transformer Networks (MGTN).

### Requirements
Please install the following packages:
- numpy
- pytorch (1.*)
- torchnet
- torchvision
- tqdm
- networkx

### Download best checkpoints
checkpoint/coco/mgtn_final_86.9762.pth.tar ([Dropbox](https://www.dropbox.com/s/fr2286gwxsg80kq/mgtn_final_86.9762.pth.tar?dl=0))
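
A minimal sketch of inspecting the downloaded checkpoint, assuming it follows the common `{'state_dict': ...}` convention used by wildcat/ML-GCN-style training code (the exact keys are not confirmed by this commit):

```python
import torch

# Hypothetical inspection of the released checkpoint; key names such as
# 'state_dict' are assumptions, not taken from this repository.
ckpt = torch.load('checkpoint/coco/mgtn_final_86.9762.pth.tar', map_location='cpu')
print(ckpt.keys())
state_dict = ckpt.get('state_dict', ckpt)  # fall back to a raw state dict
# model.load_state_dict(state_dict)  # `model` would be the MGTN model built by mgtn.py
```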

### Performance

| Method | mAP | CP | CR | CF1 | OP | OR | OF1 |
| --------------------- | ----- | ----- | ----- | ----- | ----- | ----- | ----- |
| CNN-RNN | 61.2 | - | - | - | - | - | - |
| SRN | 77.1 | 81.6 | 65.4 | 71.2 | 82.7 | 69.9 | 75.8 |
| Baseline (ResNet101) | 77.3 | 80.2 | 66.7 | 72.8 | 83.9 | 70.8 | 76.8 |
| Multi-Evidence | - | 80.4 | 70.2 | 74.9 | 85.2 | 72.5 | 78.4 |
| ML-GCN (2019) | 82.4 | 84.4 | 71.4 | 77.4 | 85.8 | 74.5 | 79.8 |
| ML-GCN (ResNeXt50 with ImageNet) | 86.2 | 85.8 | 77.3 | 81.3 | 86.2 | 79.7 | 82.8 |
| A-GCN | 83.1 | 84.7 | 72.3 | 78.0 | 85.6 | 75.5 | 80.3 |
| KSSNet | 83.7 | 84.6 | 73.2 | 77.2 | 87.8 | 76.2 | 81.5 |
| SGTN (Ours\*\*) | 86.6 | 77.2 | **82.2** | 79.6 | 76.0 | **82.6** | 79.2 |
| **MGTN (Base)** | 86.91 | **89.38** | 74.46 | 81.25 | **90.91** | 76.27 | 82.95 |
| **MGTN (Final)** | **86.98** | 86.11 | 77.85 | **81.77** | 87.71 | 79.40 | **83.35** |

\*\* SGTN (Ours): https://github.com/ReML-AI/sgtn

### MGTN on COCO

```sh
python mgtn.py data/coco --image-size 448 --workers 8 --batch-size 32 --lr 0.03 --learning-rate-decay 0.1 --epoch_step 20 30 --embedding model/embedding/coco_glove_word2vec_80x300_ec.pkl --adj-strong-threshold 0.4 --adj-weak-threshold 0.2 --device_ids 0 1 2 3
```
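
For reference, the `--embedding` file is a pickled set of per-class word vectors (80 COCO classes x 300-dimensional GloVe vectors, judging by the file name). A small sketch of inspecting it, assuming it unpickles to an array-like object:

```python
import pickle
import numpy as np

# Hypothetical inspection; the exact stored type (NumPy array vs. torch tensor)
# is an assumption based on the file name, not confirmed by this commit.
with open('model/embedding/coco_glove_word2vec_80x300_ec.pkl', 'rb') as f:
    emb = pickle.load(f)
emb = np.asarray(emb)
print(emb.shape)  # expected (80, 300): one 300-d GloVe vector per COCO class
```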

### How to cite this work?
```
@inproceedings{Nguyen:AAAI:2021,
  author    = {Nguyen, Hoang D. and Vu, Xuan-Son and Le, Duc-Trong},
  title     = {Modular Graph Transformer Networks for Multi-Label Image Classification},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
  series    = {AAAI '21},
  year      = {2021},
  publisher = {AAAI}
}
```

## References
This project is based on the following implementations:

- https://github.com/durandtibo/wildcat.pytorch
- https://github.com/tkipf/pygcn
- https://github.com/Megvii-Nanjing/ML_GCN/
- https://github.com/seongjunyun/Graph_Transformer_Networks

coco.py (+148)
import torch.utils.data as data
import json
import os
import subprocess
from PIL import Image
import numpy as np
import torch
import pickle
from util import *

urls = {'train_img': 'http://images.cocodataset.org/zips/train2014.zip',
        'val_img': 'http://images.cocodataset.org/zips/val2014.zip',
        'annotations': 'http://images.cocodataset.org/annotations/annotations_trainval2014.zip'}


def download_coco2014(root, phase):
    # Create the working directories (raw downloads in tmp/, processed data in data/).
    if not os.path.exists(root):
        os.makedirs(root)
    tmpdir = os.path.join(root, 'tmp/')
    data = os.path.join(root, 'data/')
    if not os.path.exists(data):
        os.makedirs(data)
    if not os.path.exists(tmpdir):
        os.makedirs(tmpdir)
    if phase == 'train':
        filename = 'train2014.zip'
    elif phase == 'val':
        filename = 'val2014.zip'
    cached_file = os.path.join(tmpdir, filename)
    img_data = os.path.join(data, filename.split('.')[0])
    # Download the image archive only if it is neither cached nor already extracted.
    if not os.path.exists(cached_file) and not os.path.exists(img_data):
        print('Downloading: "{}" to {}\n'.format(
            urls[phase + '_img'], cached_file))
        os.chdir(tmpdir)
        subprocess.call('wget ' + urls[phase + '_img'], shell=True)
        os.chdir(root)
    # extract file
    if not os.path.exists(img_data):
        print('[dataset] Extracting zip file {file} to {path}'.format(
            file=cached_file, path=data))
        command = 'unzip {} -d {}'.format(cached_file, data)
        os.system(command)
    print('[dataset] Done!')

    # train/val annotations
    cached_file = os.path.join(tmpdir, 'annotations_trainval2014.zip')
    annotations_data = os.path.join(data, 'annotations')
    # Download the annotation archive only if it is neither cached nor already extracted.
    if not os.path.exists(cached_file) and not os.path.exists(annotations_data):
        print('Downloading: "{}" to {}\n'.format(
            urls['annotations'], cached_file))
        os.chdir(tmpdir)
        # subprocess.call (unlike Popen) waits for wget to finish before extraction starts.
        subprocess.call('wget ' + urls['annotations'], shell=True)
        os.chdir(root)
    if not os.path.exists(annotations_data):
        print('[dataset] Extracting zip file {file} to {path}'.format(
            file=cached_file, path=data))
        command = 'unzip {} -d {}'.format(cached_file, data)
        os.system(command)
        print('[annotation] Done!')

    # Build the simplified {phase}_anno.json list of {file_name, labels} entries.
    anno = os.path.join(data, '{}_anno.json'.format(phase))
    img_id = {}
    annotations_id = {}
    if not os.path.exists(anno):
        annotations_file = json.load(
            open(os.path.join(annotations_data, 'instances_{}2014.json'.format(phase))))
        annotations = annotations_file['annotations']
        category = annotations_file['categories']
        category_id = {}
        for cat in category:
            category_id[cat['id']] = cat['name']
        cat2idx = category_to_idx(sorted(category_id.values()))
        images = annotations_file['images']
        # Collect the set of label indices present in each image.
        for annotation in annotations:
            if annotation['image_id'] not in annotations_id:
                annotations_id[annotation['image_id']] = set()
            annotations_id[annotation['image_id']].add(
                cat2idx[category_id[annotation['category_id']]])
        for img in images:
            if img['id'] not in annotations_id:
                continue
            if img['id'] not in img_id:
                img_id[img['id']] = {}
            img_id[img['id']]['file_name'] = img['file_name']
            img_id[img['id']]['labels'] = list(annotations_id[img['id']])
        anno_list = []
        for k, v in img_id.items():
            anno_list.append(v)
        json.dump(anno_list, open(anno, 'w'))
        if not os.path.exists(os.path.join(data, 'category.json')):
            json.dump(cat2idx, open(os.path.join(data, 'category.json'), 'w'))
        del img_id
        del anno_list
        del images
        del annotations_id
        del annotations
        del category
        del category_id
    print('[json] Done!')


def category_to_idx(category):
    # Map each (sorted) category name to a contiguous integer index.
    cat2idx = {}
    for cat in category:
        cat2idx[cat] = len(cat2idx)
    return cat2idx


class COCO2014(data.Dataset):
    def __init__(self, root, transform=None, phase='train', inp_name=None):
        self.root = root
        self.phase = phase
        self.img_list = []
        self.transform = transform
        download_coco2014(root, phase)
        self.get_anno()
        self.num_classes = len(self.cat2idx)

        # Load the pre-computed per-class word embeddings (the `inp` input).
        with open(inp_name, 'rb') as f:
            self.inp = pickle.load(f)
        self.inp_name = inp_name

    def get_anno(self):
        list_path = os.path.join(
            self.root, 'data', '{}_anno.json'.format(self.phase))
        self.img_list = json.load(open(list_path, 'r'))
        self.cat2idx = json.load(
            open(os.path.join(self.root, 'data', 'category.json'), 'r'))

    def __len__(self):
        return len(self.img_list)

    def __getitem__(self, index):
        item = self.img_list[index]
        return self.get(item)

    def get(self, item):
        filename = item['file_name']
        labels = sorted(item['labels'])
        img = Image.open(os.path.join(self.root, 'data',
                                      '{}2014'.format(self.phase), filename)).convert('RGB')
        if self.transform is not None:
            img = self.transform(img)
        # Multi-label target: +1 for present categories, -1 for absent ones.
        target = np.zeros(self.num_classes, np.float32) - 1
        target[labels] = 1
        return (img, filename, self.inp), target
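
A minimal usage sketch of the `COCO2014` dataset above, assuming the `data/coco` root and embedding path from the README; the transform shown is illustrative and not the training pipeline defined in mgtn.py:

```python
import torch
import torchvision.transforms as transforms
from coco import COCO2014

# Illustrative preprocessing only; mgtn.py defines the actual training transforms.
transform = transforms.Compose([
    transforms.Resize((448, 448)),
    transforms.ToTensor(),
])

# Instantiating the dataset triggers download_coco2014 if data/coco is empty.
train_dataset = COCO2014('data/coco', transform=transform, phase='train',
                         inp_name='model/embedding/coco_glove_word2vec_80x300_ec.pkl')
loader = torch.utils.data.DataLoader(train_dataset, batch_size=32,
                                     shuffle=True, num_workers=8)

(img, filename, inp), target = train_dataset[0]
print(img.shape, target.shape)  # e.g. torch.Size([3, 448, 448]) and (80,)
```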
