-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathBPRData.py
51 lines (42 loc) · 1.37 KB
/
BPRData.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
import numpy as np
import scipy.sparse as sp
import torch.utils.data as data
import pickle
class BPRData(data.Dataset):
def __init__(self, data,
num_item, train_mat=None, num_ng=0, is_training=None):
super(BPRData, self).__init__()
""" Note that the labels are only useful when training, we thus
add them in the ng_sample() function.
"""
self.data = np.array(data)
self.num_item = num_item
self.train_mat = train_mat
self.num_ng = num_ng
self.is_training = is_training
def ng_sample(self):
assert self.is_training, 'no need to sampling when testing'
tmp_trainMat = self.train_mat.todok()
length = self.data.shape[0]
self.neg_data = np.random.randint(low=0, high=self.num_item, size=length)
for i in range(length):
uid = self.data[i][0]
iid = self.neg_data[i]
if (uid, iid) in tmp_trainMat:
while (uid, iid) in tmp_trainMat:
iid = np.random.randint(low=0, high=self.num_item)
self.neg_data[i] = iid
def __len__(self):
return len(self.data)
# return self.num_ng * len(self.data) if \
# self.is_training else len(self.data)
def __getitem__(self, idx):
user = self.data[idx][0]
item_i = self.data[idx][1]
if self.is_training:
neg_data = self.neg_data
item_j = neg_data[idx]
return user, item_i, item_j
else:
return user, item_i
# neg_data = self.neg_data if self.is_training else ([-1]*len(self.data))