-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathloader.py
More file actions
48 lines (39 loc) · 1.71 KB
/
loader.py
File metadata and controls
48 lines (39 loc) · 1.71 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# -*- coding: utf-8 -*-
"""
Created on Tue Jul 14 15:53:48 2020
@author: Joann
"""
#%%
import os
import numpy as np
from torch.utils import data
#%%
class AudioFolder(data.Dataset):
def __init__(self, root, input_length=None):
self.root = root # data_path
self.input_length = input_length # 80000
self.get_songlist() # training data npy
self.binary = np.load(os.path.join(self.root, 'binary_full.npy'))
def __getitem__(self, index):
npy, tag_binary = self.get_npy(index)
return npy.astype('float32'), tag_binary.astype('float32')
def get_songlist(self):
self.fl = np.load(os.path.join(self.root, 'train_full.npy')) # npy with all training file names
def get_npy(self, index):
ix, fn = self.fl[index].split('\t') # fn = wav filename
npy_path = os.path.join(self.root, 'npy_full', fn.split('.')[0]+'.npy') # only get training files from npy
npy = np.load(npy_path)
random_idx = int(np.floor(np.random.random(1) * (len(npy)-self.input_length))) # input_length = how long to go in model
npy = np.array(npy[random_idx:random_idx+self.input_length])
tag_binary = self.binary[int(ix)]
return npy, tag_binary
def __len__(self):
return len(self.fl)
#%%
def get_audio_loader(root, batch_size, num_workers=0, input_length=None):
data_loader = data.DataLoader(dataset=AudioFolder(root, input_length=input_length),
batch_size=batch_size,
shuffle=True,
drop_last=True,
num_workers=num_workers)
return data_loader