Skip to content

Commit 098f071

Browse files
Fix movielens 10m (#156)
* First attempt at fixing MovieLens 10m
* Fix test values
1 parent f988a12 commit 098f071

File tree

2 files changed

+5
-5
lines changed

2 files changed

+5
-5
lines changed

src/datasets/graphs/movielens.jl

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -178,7 +178,7 @@ end
178178

179179
function read_10m_rating_data(dir::String)
180180
rating_data_file = "ratings.dat"
181-
rating_df = read_csv_asdf(joinpath(dir, rating_data_file), header=false, delim="::")
181+
rating_df = read_csv_asdf(joinpath(dir, rating_data_file), header=false, delim="::", quoted=false)
182182
@assert size(rating_df)[2] == 4
183183

184184
rating_data = Dict()
@@ -190,7 +190,7 @@ end
190190

191191
function read_10m_movie_data(dir::String)
192192
movie_data_file = "movies.dat"
193-
movie_df = read_csv_asdf(joinpath(dir, movie_data_file), header=false, delim="::")
193+
movie_df = read_csv_asdf(joinpath(dir, movie_data_file), header=false, delim="::", quoted=false)
194194
movie_data = Dict()
195195

196196
movie_ids = movie_df[!, 1]
@@ -213,7 +213,7 @@ end
213213

214214
function read_10m_user_tag_data(dir::String)
215215
tag_data_file = "tags.dat"
216-
tag_df = read_csv(joinpath(dir, tag_data_file), header=false, delim="::")
216+
tag_df = read_csv(joinpath(dir, tag_data_file), header=false, delim="::", quoted=false)
217217

218218
tag_data = Dict{String, Any}()
219219
tag_data["user_movie"] = tag_df[!, 1:2] |> Matrix{Int}

test/datasets/graphs_no_ci.jl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -244,12 +244,12 @@ end
244244
@test g isa MLDatasets.HeteroGraph
245245

246246
num_nodes = Dict(
247-
"tag" => 95579,
247+
"tag" => 95580,
248248
"movie" => 10681,
249249
"user" => 69878
250250
)
251251
num_edges = Dict(
252-
("user", "tag", "movie") => 191158,
252+
("user", "tag", "movie") => 191160,
253253
("user", "rating", "movie") => 20000108
254254
)
255255

0 commit comments

Comments
 (0)