ylingfeng
diff --git a/‎README.md‎
Lines changed: 95 additions & 0 deletions b/‎README.md‎
Lines changed: 95 additions & 0 deletions
diff --git a/‎checkpoints/README.md‎
Lines changed: 9 additions & 0 deletions b/‎checkpoints/README.md‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎dataset.py‎
Lines changed: 183 additions & 0 deletions b/‎dataset.py‎
Lines changed: 183 additions & 0 deletions
diff --git a/‎datasets/README.md‎
Lines changed: 13 additions & 0 deletions b/‎datasets/README.md‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎figs/structure.svg‎
Lines changed: 1 addition & 0 deletions b/‎figs/structure.svg‎
Lines changed: 1 addition & 0 deletions
@@ -0,0 +1,95 @@
+# Code for 'Dynamic MLP for Fine-Grained Image Classification by Leveraging Geographical and Temporal Information'
+
+<p align="center"> <img src="figs/structure.svg" width="100%"></p>
+Dynamic MLP is parameterized by the learned embeddings of variable locations and dates to help fine-grained image classification.
+
+## Requirements
+
+Experiment Environment
+- python 3.6
+- pytorch 1.7.1+cu101
+- torchvision 0.8.2
+
+Download the pretrained SK-Res2Net models by following [these instructions](checkpoints/README.md).  
+Download the datasets by following [these instructions](datasets/README.md).
+
+## Train the model
+### 1. Train image-only model
+Specify ```--image_only``` for training image-only models.
+- ResNet-50 (67.924% Top-1 acc)
+```bash
+CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 train.py \
+  --name res50_image_only \
+  --data 'inat21_mini' \
+  --data_dir 'path/to/your/data' \
+  --model_file 'resnet' \
+  --model_name 'resnet50' \
+  --pretrained \
+  --batch_size 512 \
+  --start_lr 0.04 \
+  --image_only
+```
+
+- SK-Res2Net-101 (76.102% Top-1 acc)
+```bash
+CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 train.py \
+  --name sk2_image_only \
+  --data 'inat21_mini' \
+  --data_dir 'path/to/your/data' \
+  --model_file 'sk2res2net' \
+  --model_name 'sk2res2net101' \
+  --pretrained \
+  --batch_size 512 \
+  --start_lr 0.04 \
+  --image_only
+```
+
+### 2. Train dynamic MLP model
+- ResNet-50 (78.751% Top-1 acc)
+```bash
+CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 train.py \
+  --name res50_dynamic_mlp \
+  --data 'inat21_mini' \
+  --data_dir 'path/to/your/data' \
+  --model_file 'resnet_dynamic_mlp' \
+  --model_name 'resnet50' \
+  --pretrained \
+  --batch_size 512 \
+  --start_lr 0.04
+```
+
+- SK-Res2Net-101 (84.694% Top-1 acc)
+```bash
+CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 train.py \
+  --name sk2_dynamic_mlp \
+  --data 'inat21_mini' \
+  --data_dir 'path/to/your/data' \
+  --model_file 'sk2res2net_dynamic_mlp' \
+  --model_name 'sk2res2net101' \
+  --pretrained \
+  --batch_size 512 \
+  --start_lr 0.04
+```
+
+## Test the model
+Specify ```--resume``` and ```--evaluate``` for inference; add ```--image_only``` when testing image-only models.
+```bash
+python3 train.py \
+  --name sk2_dynamic_mlp \
+  --data 'inat21_mini' \
+  --data_dir 'path/to/your/data' \
+  --model_file 'sk2res2net_dynamic_mlp' \
+  --model_name 'sk2res2net101' \
+  --resume 'path/to/your/checkpoint' \
+  --evaluate
+```
+
+## Model Zoo
+### iNaturalist 2021 mini (90 epochs)
+
+| Backbone       | Size  |   Acc@1    |                                      Log                                      | Download  |
+| -------------- | :---: | :--------: | :---------------------------------------------------------------------------: | :-------: |
+| ResNet-50      |  224  |   67.924   |    [log](logs/log_inat21-mini_90epoch_r50_image-only_67.924_top1_acc.txt)     | [model]() |
+| + Dynamic MLP  |  224  | **78.751** |   [log](logs/log_inat21-mini_90epoch_r50_dynamic-mlp-c_78.751_top1_acc.txt)   | [model]() |
+| SK-Res2Net-101 |  224  |   76.102   |  [log](logs/log_inat21-mini_90epoch_sk2-101_image-only_76.102_top1_acc.txt)   | [model]() |
+| + Dynamic MLP  |  224  | **84.694** | [log](logs/log_inat21-mini_90epoch_sk2-101_dynamic-mlp-c_84.694_top1_acc.txt) | [model]() |
@@ -0,0 +1,9 @@
+# Get pretrained SK-Res2Net model
+The model is trained on ImageNet-1k for 300 epochs.
+
+Click the link to download:  
+[[Google Drive]](https://drive.google.com/file/d/1CJzcta4GoYqH5I5hcHyWoBl4iU1Y4oqc/view?usp=sharing)
+[[Github]]()
+
+|-- checkpoints  
+&emsp;&emsp;|-- sk2res2net101_epoch_300.pth
@@ -0,0 +1,183 @@
+#!/usr/bin/env python3
+import datetime
+import json
+import math
+import os
+
+import numpy as np
+import torch
+import torchvision.transforms as transforms
+from PIL import Image
+from torch.utils.data import Dataset
+
+# Per-channel normalization shared by the training and validation transform pipelines in this module.
+# NOTE(review): these mean/std values look like the commonly used ImageNet RGB statistics — confirm.
+normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
+
+
+class INatDataset(Dataset):
+    '''
+    iNaturalist image dataset that also yields encoded location/date metadata.
+
+    Annotations are read from a JSON file under ``root``: ``train_mini.json``
+    when ``train`` is true and ``data`` contains ``'mini'``, ``train.json`` for
+    any other training set, and ``val.json`` otherwise.
+
+    Args:
+        data: dataset identifier; only checked for the substring ``'mini'``.
+        root: directory holding the annotation JSON files and the image files.
+        train: selects the training split when true, the validation split otherwise.
+        transform: optional callable applied to the loaded PIL image.
+        args: namespace read in ``__getitem__`` for ``metadata`` and ``mlp_cin``.
+    '''
+
+    def __init__(self, data, root, train, transform=None, args=None):
+        self.transform = transform
+        self.args = args
+
+        if not train:
+            json_name = 'val.json'
+        elif 'mini' in data:
+            json_name = 'train_mini.json'
+        else:
+            json_name = 'train.json'
+        jpath = os.path.join(root, json_name)
+
+        with open(jpath, 'r') as f:
+            # json.load parses from a file object; json.loads only accepts str/bytes
+            # and would raise TypeError here.
+            annotations = json.load(f)
+
+        # NOTE(review): images and annotations are paired by position, which assumes
+        # both lists are stored in the same order — confirm against the annotation files.
+        samples = []
+        for img, ann in zip(annotations['images'], annotations['annotations']):
+            img_path = os.path.join(root, img['file_name'])
+            extra = {'date': img['date'], 'latitude': img['latitude'], 'longitude': img['longitude']}
+            samples.append((img_path, int(ann['category_id']), extra))
+
+        self.samples = samples
+
+    def __len__(self):
+        '''Return the number of (image, annotation) pairs that were loaded.'''
+        return len(self.samples)
+
+    def __getitem__(self, idx):
+        '''
+        Return ``(img, label, loc)`` for the sample at ``idx``.
+
+        ``loc`` is the sin/cos encoding of the metadata fields selected by
+        ``args.metadata`` ('geo' adds latitude and longitude, 'temporal' adds
+        the date). When date, latitude or longitude is missing, ``loc`` is a
+        zero vector of length ``args.mlp_cin`` instead.
+        '''
+        img_path, label, extra = self.samples[idx]
+        date = extra['date']  # capture time
+        lat = extra['latitude']  # latitude, -90 ~ 90
+        lng = extra['longitude']  # longitude, -180 ~ 180
+        if (lat is not None) and (lng is not None) and (date is not None):
+            # Only the leading 'YYYY-MM-DD' part of the timestamp is used.
+            date_time = datetime.datetime.strptime(date[:10], '%Y-%m-%d')
+            date = get_scaled_date_ratio(date_time)
+            lat = float(lat) / 90
+            lng = float(lng) / 180
+            loc = []
+            if 'geo' in self.args.metadata:
+                loc += [lat, lng]
+            if 'temporal' in self.args.metadata:
+                loc += [date]
+            loc = encode_loc_time(np.array(loc))
+        else:
+            loc = np.zeros(self.args.mlp_cin, float)
+        # Force three channels so grayscale/palette/RGBA files work with the
+        # 3-channel normalization; the context manager releases the file handle.
+        with Image.open(img_path) as raw:
+            img = raw.convert('RGB')
+        if self.transform is not None:
+            img = self.transform(img)
+        return img, label, loc
+
+
+def encode_loc_time(loc_time):
+    '''
+    Encode each input feature as a (sin, cos) pair.
+
+    The input is multiplied by pi, then the sines of all features are
+    concatenated with the cosines of all features, so the result is twice as
+    long as the input. Inputs are assumed to lie in the range -1 to 1.
+    '''
+    angles = math.pi * loc_time
+    sin_part = np.sin(angles)
+    cos_part = np.cos(angles)
+    return np.concatenate((sin_part, cos_part))
+
+
+def _is_leap_year(year):
+    '''
+    Return True when ``year`` is divisible by 4, except for years divisible
+    by 100 that are not also divisible by 400.
+    '''
+    return year % 4 == 0 and (year % 100 != 0 or year % 400 == 0)
+
+
+def get_scaled_date_ratio(date_time):
+    r'''
+    Convert a date to its day-of-year fraction, rescaled as ``fraction * 2 - 1``.
+
+    The fraction is (day of year) / (days in that year), so 31 December maps
+    to 1 and 1 January maps to slightly above -1. Only the ``year``, ``month``
+    and ``day`` attributes of ``date_time`` are read.
+    '''
+    year, month, day = date_time.year, date_time.month, date_time.day
+    leap = _is_leap_year(year)
+
+    # February gains a day in leap years, and so does the year length.
+    month_lengths = [31, 29 if leap else 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31]
+    days_in_year = 366 if leap else 365
+
+    assert day <= month_lengths[month - 1]
+    day_of_year = sum(month_lengths[:month - 1]) + day
+    assert 0 < day_of_year <= days_in_year
+
+    return (day_of_year / days_in_year) * 2 - 1
+
+
+def load_train_dataset(args):
+    '''
+    Build the shuffled training DataLoader for the dataset named by ``args.data``.
+
+    Sets ``args.num_classes`` as a side effect. Reads ``args.data``,
+    ``args.data_dir``, ``args.batch_size`` and ``args.num_workers``; ``args`` is
+    also handed to ``INatDataset``.
+
+    Raises:
+        NotImplementedError: if ``args.data`` is not one of 'inat17', 'inat18',
+            'inat21_mini' or 'inat21_full'.
+    '''
+    if args.data == 'inat17':
+        args.num_classes = 5089
+    elif args.data == 'inat18':
+        args.num_classes = 8142
+    # A bare `== 'inat21_mini' or 'inat21_full'` is always truthy (non-empty string),
+    # which made the error branch unreachable; use a membership test instead.
+    elif args.data in ('inat21_mini', 'inat21_full'):
+        args.num_classes = 10000
+    else:
+        raise NotImplementedError
+
+    train_transform = transforms.Compose([
+        transforms.RandomResizedCrop(224),
+        transforms.RandomHorizontalFlip(),
+        transforms.ToTensor(),
+        normalize,
+    ])
+    dataset = INatDataset(
+        args.data,
+        root=args.data_dir,
+        train=True,
+        transform=train_transform,
+        args=args,
+    )
+    train_loader = torch.utils.data.DataLoader(
+        dataset,
+        batch_size=args.batch_size,
+        shuffle=True,
+        num_workers=args.num_workers,
+        pin_memory=True,
+    )
+    return train_loader
+
+
+def load_val_dataset(args):
+    '''
+    Build the unshuffled validation DataLoader for the dataset named by ``args.data``.
+
+    Sets ``args.num_classes`` as a side effect. Images are resized to 256 and
+    then either center-cropped to 224, or, when ``args.tencrop`` is truthy,
+    expanded with ``TenCrop(224)`` into a stacked tensor of crops. Also reads
+    ``args.data_dir``, ``args.batch_size`` and ``args.num_workers``; ``args`` is
+    handed to ``INatDataset``.
+
+    Raises:
+        NotImplementedError: if ``args.data`` is not one of 'inat17', 'inat18',
+            'inat21_mini' or 'inat21_full'.
+    '''
+    if args.data == 'inat17':
+        args.num_classes = 5089
+    elif args.data == 'inat18':
+        args.num_classes = 8142
+    # A bare `== 'inat21_mini' or 'inat21_full'` is always truthy (non-empty string),
+    # which made the error branch unreachable; use a membership test instead.
+    elif args.data in ('inat21_mini', 'inat21_full'):
+        args.num_classes = 10000
+    else:
+        raise NotImplementedError
+
+    # Only the crop stage differs between the two modes; the dataset and loader
+    # are built once below.
+    if args.tencrop:
+        crop_steps = [
+            transforms.TenCrop(224),
+            transforms.Lambda(lambda crops: torch.stack([transforms.ToTensor()(crop) for crop in crops])),
+            transforms.Lambda(lambda crops: torch.stack([normalize(crop) for crop in crops])),
+        ]
+    else:
+        crop_steps = [
+            transforms.CenterCrop(224),
+            transforms.ToTensor(),
+            normalize,
+        ]
+
+    dataset = INatDataset(
+        args.data,
+        root=args.data_dir,
+        train=False,
+        transform=transforms.Compose([transforms.Resize(256)] + crop_steps),
+        args=args,
+    )
+    val_loader = torch.utils.data.DataLoader(
+        dataset,
+        batch_size=args.batch_size,
+        shuffle=False,
+        num_workers=args.num_workers,
+        pin_memory=True,
+    )
+    return val_loader
@@ -0,0 +1,13 @@
+# Get iNaturalist datasets
+
+Download the iNaturalist datasets at:
+https://github.com/visipedia/inat_comp
+
+|-- datasets/  
+&emsp;&emsp;|-- inat21/  
+&emsp;&emsp;&emsp;&emsp;|-- train_mini.json  
+&emsp;&emsp;&emsp;&emsp;|-- train.json  
+&emsp;&emsp;&emsp;&emsp;|-- val.json  
+&emsp;&emsp;&emsp;&emsp;|-- train_mini/  
+&emsp;&emsp;&emsp;&emsp;|-- train/  
+&emsp;&emsp;&emsp;&emsp;|-- val/