From ae0b846ea689df364056965284ea304bf5fa8981 Mon Sep 17 00:00:00 2001
From: mmosc <ma.moscati@gmail.com>
Date: Fri, 2 Dec 2022 10:46:30 +0100
Subject: [PATCH 1/5] feat: add k-fold cv.

---
 recbole/data/dataset/dataset.py | 18 ++++++++++++++++++
 recbole/data/utils.py           | 22 ++++++++++++++++++++--
 recbole/properties/overall.yaml | 27 +++++++++++++++------------
 3 files changed, 53 insertions(+), 14 deletions(-)

diff --git a/recbole/data/dataset/dataset.py b/recbole/data/dataset/dataset.py
index 7d010e5f8..1d308e63e 100644
--- a/recbole/data/dataset/dataset.py
+++ b/recbole/data/dataset/dataset.py
@@ -1796,6 +1796,24 @@ def build(self):
                 raise NotImplementedError(
                     f"The grouping method [{group_by}] has not been implemented."
                 )
+
+        elif split_mode == "KF":
+            """
+            Will return n_folds datasets
+            """
+            if not isinstance(split_args["KF"], list):
+                raise ValueError(f'The value of "KF" [{split_args}] should be a list.')
+            if group_by is None or group_by.lower() == "none":
+                datasets = self.split_by_ratio(split_args["KF"], group_by=None)
+            elif group_by == "user":
+                datasets = self.split_by_ratio(
+                    split_args["KF"], group_by=self.uid_field
+                )
+            else:
+                raise NotImplementedError(
+                    f"The grouping method [{group_by}] has not been implemented."
+                )
+
         elif split_mode == "LS":
             datasets = self.leave_one_out(
                 group_by=self.uid_field, leave_one_mode=split_args["LS"]
diff --git a/recbole/data/utils.py b/recbole/data/utils.py
index c7da013e9..e1b3516a6 100644
--- a/recbole/data/utils.py
+++ b/recbole/data/utils.py
@@ -22,6 +22,9 @@
 from recbole.utils import ModelType, ensure_dir, get_local_time, set_color
 from recbole.utils.argument_list import dataset_arguments
 
+from recbole.data.interaction import cat_interactions
+from recbole.data.dataset.dataset import Dataset
+
 
 def create_dataset(config):
     """Create dataset according to :attr:`config['model']` and :attr:`config['MODEL_TYPE']`.
@@ -160,9 +163,24 @@ def data_preparation(config, dataset):
         train_data, valid_data, test_data = dataloaders
     else:
         model_type = config["MODEL_TYPE"]
-        built_datasets = dataset.build()
+        if list(config["eval_args"]["split"].keys())[0] == 'KF':
+            print("==KF")
+            folds = dataset.build()# data_preparation(config, dataset)
+            n_folds = len(folds)
+            print(n_folds)
+            k = config["eval_args"]["fold"]
+
+            train_dataset = Dataset(config)
+            train_dataset.inter_feat = cat_interactions([fold.inter_feat for fold in folds[k: n_folds - 2 + k]])
+            valid_dataset = folds[n_folds - 2 + k]
+            test_dataset = folds[n_folds - 1 + k]
+
+            built_datasets = [train_dataset, valid_dataset, test_dataset]
+
+        else:
+            built_datasets = dataset.build()
+            train_dataset, valid_dataset, test_dataset = built_datasets
 
-        train_dataset, valid_dataset, test_dataset = built_datasets
         train_sampler, valid_sampler, test_sampler = create_samplers(
             config, dataset, built_datasets
         )
diff --git a/recbole/properties/overall.yaml b/recbole/properties/overall.yaml
index 577e4c0b4..2ab44a93a 100644
--- a/recbole/properties/overall.yaml
+++ b/recbole/properties/overall.yaml
@@ -5,20 +5,20 @@ use_gpu: True                   # (bool) Whether or not to use GPU.
 seed: 2020                      # (int) Random seed.
 state: INFO                     # (str) Logging level.
 reproducibility: True           # (bool) Whether or not to make results reproducible.
-data_path: 'dataset/'           # (str) The path of input dataset.
+data_path: /home/marta/jku/fairinterplay/dataset  # (str) The path of input dataset.
 checkpoint_dir: 'saved'         # (str) The path to save checkpoint file.
-show_progress: True             # (bool) Whether or not to show the progress bar of every epoch. 
-save_dataset: False             # (bool) Whether or not to save filtered dataset.
+show_progress: True             # (bool) Whether or not to show the progress bar of every epoch.
+save_dataset: True             # (bool) Whether or not to save filtered dataset.
 dataset_save_path: ~            # (str) The path of saved dataset.
-save_dataloaders: False         # (bool) Whether or not save split dataloaders.
+save_dataloaders: True         # (bool) Whether or not save split dataloaders.
 dataloaders_save_path: ~        # (str) The path of saved dataloaders.
-log_wandb: False                # (bool) Whether or not to use Weights & Biases(W&B).
+log_wandb: True                # (bool) Whether or not to use Weights & Biases(W&B).
 wandb_project: 'recbole'        # (str) The project to conduct experiments in W&B.
 shuffle: True                   # (bool) Whether or not to shuffle the training data before each epoch.
 
 # Training Settings
 epochs: 300                     # (int) The number of training epochs.
-train_batch_size: 2048          # (int) The training batch size.
+train_batch_size: 1024          # (int) The training batch size.
 learner: adam                   # (str) The name of used optimizer.
 learning_rate: 0.001            # (float) Learning rate.
 train_neg_sample_args:          # (dict) Negative sampling configuration for model training.
@@ -29,7 +29,7 @@ train_neg_sample_args:          # (dict) Negative sampling configuration for mod
   candidate_num: 0              # (int) The number of candidate negative items when dynamic negative sampling.
 eval_step: 1                    # (int) The number of training epochs before an evaluation on the valid dataset.
 stopping_step: 10               # (int) The threshold for validation-based early stopping.
-clip_grad_norm: ~               # (dict) The args of clip_grad_norm_ which will clip gradient norm of model. 
+clip_grad_norm: ~               # (dict) The args of clip_grad_norm_ which will clip gradient norm of model.
 weight_decay: 0.0               # (float) The weight decay value (L2 penalty) for optimizers.
 loss_decimal_place: 4           # (int) The decimal place of training loss.
 require_pow: False              # (bool) Whether or not to perform power operation in EmbLoss.
@@ -39,14 +39,17 @@ transform: ~                    # (str) The transform operation for batch data p
 
 # Evaluation Settings
 eval_args:                      # (dict) 4 keys: group_by, order, split, and mode
-  split: {'RS':[0.8,0.1,0.1]}   # (dict) The splitting strategy ranging in ['RS','LS'].
-  group_by: user                # (str) The grouping strategy ranging in ['user', 'none'].
+  # split: {'LS': 'valid_and_test'}   # (dict) The splitting strategy ranging in ['RS','LS'].
+  # split: { 'RS': [0.6, 0.2, 0.2] }   # (dict) The splitting strategy ranging in ['RS','LS'].
+  split: {'KF': [0.2, 0.2, 0.2, 0.2, 0.2]}
+  fold: 0
+  group_by: none                # (str) The grouping strategy ranging in ['user', 'none'].
   order: RO                     # (str) The ordering strategy ranging in ['RO', 'TO'].
   mode: full                    # (str) The evaluation mode ranging in ['full','unixxx','popxxx','labeled'].
-repeatable: False               # (bool) Whether to evaluate results with a repeatable recommendation scene. 
+repeatable: False               # (bool) Whether to evaluate results with a repeatable recommendation scene.
 metrics: ["Recall","MRR","NDCG","Hit","Precision"]  # (list or str) Evaluation metrics.
 topk: [10]                      # (list or int or None) The value of k for topk evaluation metrics.
-valid_metric: MRR@10            # (str) The evaluation metric for early stopping. 
+valid_metric: 'NDCG@10'         # (str) The evaluation metric for early stopping.
 valid_metric_bigger: True       # (bool) Whether to take a bigger valid metric value as a better result.
-eval_batch_size: 4096           # (int) The evaluation batch size.
+eval_batch_size: 1024           # (int) The evaluation batch size.
 metric_decimal_place: 4         # (int) The decimal place of metric scores.
\ No newline at end of file

From 5878883bf473cf6b87c91a0ab39b6d5f51b7ad41 Mon Sep 17 00:00:00 2001
From: mmosc <ma.moscati@gmail.com>
Date: Fri, 2 Dec 2022 12:29:25 +0100
Subject: [PATCH 2/5] edit: Add instructions for K-fold CV in the README.

---
 README.md | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)

diff --git a/README.md b/README.md
index 4e3810188..ed50ee1eb 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,35 @@
 ![RecBole Logo](asset/logo.png)
 
 --------------------------------------------------------------------------------
+# K-fold CV
+This branch contains an implementation of K-fold CV in RecBole. The implementation relies on
+RecBole's Dataset class and its methods `split_by_ratio` and `build` (`recbole/data/dataset/dataset.py`), on the function `data_preparation`)
+(`recbole/data/utils.py`), and on the general configuration file `overall.yaml` (`recbole/properties`).
+
+Running RecBole calls the `quick_start.py` (`recbole/quick_start`) script, which splits the data with `data_preparation(config, dataset)`.
+K-fold CV happens in this function. First, calling `dataset.build()` with the parameters stored in the
+`config` dictionary splits the dataset into folds whose sizes are defined in `overall.yaml` by the fraction of interactions assigned to
+each fold (e.g., [0.2, 0.2, 0.2, 0.2, 0.2] for 5 folds). The resulting fold datasets are stored as a list in the variable `folds`.
+
+The variable `k` (the `fold` entry of `eval_args`) selects which rotation of the folds is used in the current experiment, e.g., for a 5-fold CV and $k=0$,
+the first three splits will be assigned to the train set, the fourth to the validation, and the last one to the test set.
+
+The function then initializes `train_dataset` as an empty Dataset(config) instance, and fills it with the interactions of the 
+corresponding folds. The remaining two folds are assigned to `valid_dataset`.
+
+For running an experiment on the first fold of a 5-fold CV, the `eval_args` in the `overall.yaml` file need to be set to:
+```python
+# Evaluation Settings
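+eval_args:                      # (dict) 5 keys: split, fold, group_by, order, and mode
+  split: {'KF': [0.2, 0.2, 0.2, 0.2, 0.2]}  # (dict) 'KF' maps to the list of per-fold ratios.
+  fold: 0                       # (int) Index of the fold rotation used for this run.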
+  group_by: none                # (str) The grouping strategy ranging in ['user', 'none'].
+  order: RO                     # (str) The ordering strategy ranging in ['RO', 'TO'].
+  mode: full                    # (str) The evaluation mode ranging in ['full','unixxx','popxxx','labeled'].
+
+```
+
+
 
 # RecBole (伯乐)
 

From a5bf8227df8815c813ac4d3268b5b7ffaf34d603 Mon Sep 17 00:00:00 2001
From: mmosc <ma.moscati@gmail.com>
Date: Fri, 2 Dec 2022 12:31:39 +0100
Subject: [PATCH 3/5] edit: Edit README.

---
 README.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index ed50ee1eb..024f8ea7d 100644
--- a/README.md
+++ b/README.md
@@ -3,7 +3,7 @@
 --------------------------------------------------------------------------------
 # K-fold CV
 This branch contains an implementation of K-fold CV in RecBole. The implementation relies on
-RecBole's Dataset class and its methods `split_by_ratio` and `build` (`recbole/data/dataset/dataset.py`), on the function `data_preparation`)
+RecBole's Dataset class and its methods `split_by_ratio` and `build` (`recbole/data/dataset/dataset.py`), on the function `data_preparation`
 (`recbole/data/utils.py`), and on the general configuration file `overall.yaml` (`recbole/properties`).
 
 Running RecBole calls the `quick_start.py` (`recbole/quick_start`) script, which splits the data with `data_preparation(config, dataset)`.
@@ -15,7 +15,7 @@ The variable k stores which permutation of the folds is to be used in the curren
 the first three splits will be assigned to the train set, the fourth to the validation, and the last one to the test set.
 
 The function then initializes `train_dataset` as an empty Dataset(config) instance, and fills it with the interactions of the 
-corresponding folds. The remaining two folds are assigned to `valid_dataset`.
+corresponding folds. The remaining two folds are assigned to `valid_dataset` and `test_dataset`.
 
 For running an experiment on the first fold of a 5-fold CV, the `eval_args` in the `overall.yaml` file need to be set to:
 ```python

From 6fe4f960e5c5f3a632bfefaf14ccde97c070d9a2 Mon Sep 17 00:00:00 2001
From: mmosc <ma.moscati@gmail.com>
Date: Fri, 2 Dec 2022 15:25:28 +0100
Subject: [PATCH 4/5] fix: bug in k-fold.

---
 recbole/data/utils.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/recbole/data/utils.py b/recbole/data/utils.py
index e1b3516a6..1cd4dc490 100644
--- a/recbole/data/utils.py
+++ b/recbole/data/utils.py
@@ -169,11 +169,12 @@ def data_preparation(config, dataset):
             n_folds = len(folds)
             print(n_folds)
             k = config["eval_args"]["fold"]
+            folds = folds[k:] + folds[:k]
 
             train_dataset = Dataset(config)
-            train_dataset.inter_feat = cat_interactions([fold.inter_feat for fold in folds[k: n_folds - 2 + k]])
-            valid_dataset = folds[n_folds - 2 + k]
-            test_dataset = folds[n_folds - 1 + k]
+            train_dataset.inter_feat = cat_interactions([fold.inter_feat for fold in folds[: n_folds - 2]])
+            valid_dataset = folds[n_folds - 2]
+            test_dataset = folds[n_folds - 1]
 
             built_datasets = [train_dataset, valid_dataset, test_dataset]
 

From 732fa1fcae3c5f899527bd70a493c65a6c1b64ce Mon Sep 17 00:00:00 2001
From: mmosc <ma.moscati@gmail.com>
Date: Mon, 5 Dec 2022 11:35:28 +0100
Subject: [PATCH 5/5] edit: Change fold

---
 recbole/properties/overall.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/recbole/properties/overall.yaml b/recbole/properties/overall.yaml
index 2ab44a93a..84033a1f5 100644
--- a/recbole/properties/overall.yaml
+++ b/recbole/properties/overall.yaml
@@ -42,7 +42,7 @@ eval_args:                      # (dict) 4 keys: group_by, order, split, and mod
   # split: {'LS': 'valid_and_test'}   # (dict) The splitting strategy ranging in ['RS','LS'].
   # split: { 'RS': [0.6, 0.2, 0.2] }   # (dict) The splitting strategy ranging in ['RS','LS'].
   split: {'KF': [0.2, 0.2, 0.2, 0.2, 0.2]}
-  fold: 0
+  fold: 2
   group_by: none                # (str) The grouping strategy ranging in ['user', 'none'].
   order: RO                     # (str) The ordering strategy ranging in ['RO', 'TO'].
   mode: full                    # (str) The evaluation mode ranging in ['full','unixxx','popxxx','labeled'].