Skip to content

Commit e1a5825

Browse files
Merge pull request #2248 from recommenders-team/staging
Staging to main: Fix the issue with Movielens
2 parents 5eca0ba + a251a52 commit e1a5825

File tree

2 files changed

+7
-7
lines changed

2 files changed

+7
-7
lines changed

examples/01_prepare_data/data_split.ipynb

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@
7373
"metadata": {},
7474
"outputs": [],
7575
"source": [
76-
"DATA_URL = \"https://files.grouplens.org/datasets/movielens/ml-100k/u.data\"\n",
76+
"DATA_URL = \"http://files.grouplens.org/datasets/movielens/ml-100k/u.data\"\n",
7777
"DATA_PATH = \"ml-100k.data\"\n",
7878
"\n",
7979
"COL_USER = \"UserId\"\n",
@@ -1195,4 +1195,4 @@
11951195
},
11961196
"nbformat": 4,
11971197
"nbformat_minor": 2
1198-
}
1198+
}

recommenders/datasets/movielens.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -159,7 +159,7 @@ def load_pandas_df(
159159
):
160160
"""Loads the MovieLens dataset as pd.DataFrame.
161161
162-
Download the dataset from https://files.grouplens.org/datasets/movielens, unzip, and load.
162+
Download the dataset from http://files.grouplens.org/datasets/movielens, unzip, and load.
163163
To load movie information only, you can use load_item_df function.
164164
165165
Args:
@@ -304,7 +304,7 @@ def _load_item_df(size, item_datapath, movie_col, title_col, genres_col, year_co
304304
genres_header_100k = None
305305
if genres_col is not None:
306306
# 100k data's movie genres are encoded as a binary array (the last 19 fields)
307-
# For details, see https://files.grouplens.org/datasets/movielens/ml-100k-README.txt
307+
# For details, see http://files.grouplens.org/datasets/movielens/ml-100k-README.txt
308308
if size == "100k":
309309
genres_header_100k = [*(str(i) for i in range(19))]
310310
item_header.extend(genres_header_100k)
@@ -366,7 +366,7 @@ def load_spark_df(
366366
):
367367
"""Loads the MovieLens dataset as `pyspark.sql.DataFrame`.
368368
369-
Download the dataset from https://files.grouplens.org/datasets/movielens, unzip, and load as `pyspark.sql.DataFrame`.
369+
Download the dataset from http://files.grouplens.org/datasets/movielens, unzip, and load as `pyspark.sql.DataFrame`.
370370
371371
To load movie information only, you can use `load_item_df` function.
372372
@@ -552,7 +552,7 @@ def download_movielens(size, dest_path):
552552
if size not in DATA_FORMAT:
553553
raise ValueError(f"Size: {size}. " + ERROR_MOVIE_LENS_SIZE)
554554

555-
url = "https://files.grouplens.org/datasets/movielens/ml-" + size + ".zip"
555+
url = "http://files.grouplens.org/datasets/movielens/ml-" + size + ".zip"
556556
dirs, file = os.path.split(dest_path)
557557
maybe_download(url, file, work_directory=dirs)
558558

@@ -587,7 +587,7 @@ class MockMovielensSchema(pa.DataFrameModel):
587587
Mock dataset schema to generate fake data for testing purpose.
588588
This schema is configured to mimic the Movielens dataset
589589
590-
https://files.grouplens.org/datasets/movielens/ml-100k/
590+
http://files.grouplens.org/datasets/movielens/ml-100k/
591591
592592
Dataset schema and generation is configured using pandera.
593593
Please see https://pandera.readthedocs.io/en/latest/schema_models.html

0 commit comments

Comments (0)