Sign-Language/dataset.py at master · Tech-Matrix/Sign-Language · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
import torch
import torch.nn as nn
import numpy as np
from torch.utils.data import Dataset
import torchvision.transforms as transforms

from typing import List
import csv

class SignLanguageMNIST(Dataset):
    """Sign language dataset
    Converting the the csv dataset into labels and images of shape 28*28(where input is a 784 dimensional data)
    Utility for loading Sign Language dataset into PyTorch. Dataset posted on
    Kaggle in 2017, by an unnamed author with username `tecperson`:
    https://www.kaggle.com/datamunge/sign-language-mnist
    Each sample image is 1*1*28*28 tensor and label is scaler"""

    @staticmethod
    def get_label_mapping():
        '''We map all labels to range [0,23].The J and Z letters have been omitted.
         This mapping from dataset labels [0, 23]
        to letter indices [0, 25] is returned below.'''
        mapping = list(range(25))
        mapping.pop(9)
        return mapping

    @staticmethod
    def read_label_samples_from_csv(path:str):
        '''Assuming first column is filled with labels and nest 784 columns represent each pixel value of images.
        All pixel value ranges from 0-255 '''
        mapping = SignLanguageMNIST.get_label_mapping()
        labels , samples = [] , []
        with open(path) as f:
            _ = next(f)
            for line in csv.reader(f):
                label = int(line[0])
                labels.append(mapping.index(label))
                samples.append(list(map(int,line[1:])))
        return labels , samples

    def __init__(self,path: str="data/sign_mnist_train.csv",mean: List[float] = [0.485],std: List[float] = [0.229]):
        #Args : path containing csv file
        #mean and std are for normalizing the data
        labels , samples = SignLanguageMNIST.read_label_samples_from_csv(path)
        self._samples = np.array(samples,dtype=np.uint8).reshape((-1,28,28,1))
        self._labels = np.array(labels,dtype=np.uint8).reshape((-1,1))

        self._mean = mean
        self._std = std

    def __len__(self):
        return len(self._labels)

    def __getitem__(self,idx):
        transform = transforms.Compose([
            transforms.ToPILImage(),
            transforms.RandomResizedCrop(28,scale=(0.8,1.2)),
            transforms.ToTensor(),
            transforms.Normalize(mean=self._mean, std=self._std)
        ])

        return {
            'image' : transform(self._samples[idx]).float(),
            'label' : torch.from_numpy(self._labels[idx]).float()
        }

def get_train_test_loaders(batch_size=32):
    trainset = SignLanguageMNIST('data/sign_mnist_train.csv')
    trainloader = torch.utils.data.DataLoader(trainset,batch_size=batch_size,shuffle=True)

    testset = SignLanguageMNIST('data/sign_mnist_test.csv')
    testloader = torch.utils.data.DataLoader(testset,batch_size=batch_size,shuffle=False)
    return trainloader , testloader

if __name__ == '__main__':
    loader , _ = get_train_test_loaders(2)
    print(next(iter(loader)))