|
"""
    Netflix()

Read the headerless, comma-separated file `netflix/netflix.csv` located under
`defdir` and hand a three-column table to `Persa.Dataset`:

- `user`: column 1 of the file, passed through `labelencode(labelmap(...), ...)`
- `item`: column 2 of the file, unchanged
- `rating`: column 3 of the file, unchanged

The declared return type is `Persa.CFDataset`.
"""
function Netflix()::Persa.CFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/netflix/netflix.csv", separator = ',', header = false)

    # Users are re-encoded using a label map built from the same column.
    users = raw[:,1]

    ratings = DataFrame(user = labelencode(labelmap(users), users),
                        item = raw[:,2],
                        rating = raw[:,3])

    return Persa.Dataset(ratings)
end
|
14 | 14 |
|
"""
    MovieTweeting()

Read the headerless file `Movie-Tweeting-200k/ratings.dat` located under
`defdir`, using `':'` as the separator, and hand a four-column table to
`Persa.Dataset`:

- `user`: column 1 of the file, unchanged
- `item`: column 2 of the file, passed through `labelencode(labelmap(...), ...)`
- `rating`: column 3 of the file, unchanged
- `timestamp`: column 4 of the file, unchanged

The declared return type is `Persa.TimeCFDataset`.
"""
function MovieTweeting()::Persa.TimeCFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/Movie-Tweeting-200k/ratings.dat", separator = ':', header = false)

    # Items are re-encoded using a label map built from the same column.
    items = raw[:,2]

    ratings = DataFrame(user = raw[:,1],
                        item = labelencode(labelmap(items), items),
                        rating = raw[:,3],
                        timestamp = raw[:,4])

    return Persa.Dataset(ratings)
end
|
28 | 28 |
|
"""
    MovieTweeting10k()

Read the headerless file `mt-snapshot-10k/ratings.dat` located under `defdir`,
using `':'` as the separator, and hand a four-column table to `Persa.Dataset`:

- `user`: column 1 of the file, unchanged
- `item`: column 2 of the file, passed through `labelencode(labelmap(...), ...)`
- `rating`: column 3 of the file, unchanged
- `timestamp`: column 4 of the file, unchanged

The declared return type is `Persa.TimeCFDataset`.
"""
function MovieTweeting10k()::Persa.TimeCFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/mt-snapshot-10k/ratings.dat", separator = ':', header = false)

    # Items are re-encoded using a label map built from the same column.
    items = raw[:,2]

    ratings = DataFrame(user = raw[:,1],
                        item = labelencode(labelmap(items), items),
                        rating = raw[:,3],
                        timestamp = raw[:,4])

    return Persa.Dataset(ratings)
end
|
42 | 42 |
|
"""
    CiaoDVD()

Read the headerless, comma-separated file `CiaoDVD/movie-ratings.txt` located
under `defdir` and hand a four-column table to `Persa.Dataset`:

- `user`: column 1 of the file, unchanged
- `item`: column 2 of the file, unchanged
- `rating`: column 5 of the file, unchanged
- `timestamp`: column 6 of the file, parsed with `Dates.DateTime`, mapped
  through `Dates.datetime2unix`, then converted to `Array{Int}`

The declared return type is `Persa.TimeCFDataset`.
"""
function CiaoDVD()::Persa.TimeCFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/CiaoDVD/movie-ratings.txt", separator = ',', header = false)

    # Column 6 is given to `Dates.DateTime` as a whole column (not broadcast);
    # only `datetime2unix` is applied element-wise.
    parsed = Dates.DateTime(raw[:,6])
    unixtimes = Dates.datetime2unix.(parsed)

    ratings = DataFrame(user = raw[:,1],
                        item = raw[:,2],
                        rating = raw[:,5],
                        timestamp = convert(Array{Int}, unixtimes))

    return Persa.Dataset(ratings)
end
|
56 | 56 |
|
"""
    FilmTrust()

Read the headerless, space-separated file `FilmTrust/ratings.txt` located under
`defdir` and hand a three-column table to `Persa.Dataset`:

- `user`: column 1 of the file, unchanged
- `item`: column 2 of the file, unchanged
- `rating`: column 3 of the file, unchanged

The declared return type is `Persa.CFDataset`.
"""
function FilmTrust()::Persa.CFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/FilmTrust/ratings.txt", separator = ' ', header = false)

    ratings = DataFrame(user = raw[:,1],
                        item = raw[:,2],
                        rating = raw[:,3])

    return Persa.Dataset(ratings)
end
|
69 | 69 |
|
"""
    YahooMusic()

Read the headerless, space-separated file
`yahoo-music-r3/ymusic-r3-dummy-time.dat` located under `defdir` and hand a
three-column table to `Persa.Dataset`:

- `user`: column 1 of the file, unchanged
- `item`: column 2 of the file, unchanged
- `rating`: column 3 of the file, unchanged

Only the first three columns of the file are used. The declared return type is
`Persa.CFDataset`.
"""
function YahooMusic()::Persa.CFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/yahoo-music-r3/ymusic-r3-dummy-time.dat", separator = ' ', header = false)

    ratings = DataFrame(user = raw[:,1],
                        item = raw[:,2],
                        rating = raw[:,3])

    return Persa.Dataset(ratings)
end
|
82 | 82 |
|
"""
    LastFM()

Read the headerless, comma-separated file `lastfm/last_fm.dat` located under
`defdir` and hand a three-column table to `Persa.Dataset`:

- `user`: column 1 of the file, passed through `labelencode(labelmap(...), ...)`
- `item`: column 2 of the file, passed through `labelencode(labelmap(...), ...)`
- `rating`: column 3 of the file, unchanged

The declared return type is `Persa.CFDataset`.
"""
function LastFM()::Persa.CFDataset
    # NOTE(review): `defdir` is not defined in this function; it is expected to
    # come from the enclosing module.
    raw = readtable("$(defdir)/lastfm/last_fm.dat", separator = ',', header = false)

    # Both identifier columns are re-encoded, each with a label map built from
    # its own values.
    users = raw[:,1]
    items = raw[:,2]

    ratings = DataFrame(user = labelencode(labelmap(users), users),
                        item = labelencode(labelmap(items), items),
                        rating = raw[:,3])

    return Persa.Dataset(ratings)
end
|
0 commit comments