update the user_based 2,40

861461d5 · Adrien Payen · cd5b2ed2 · 861461d5
--- a/user_based.ipynb
+++ b/user_based.ipynb
@@ -11,19 +11,16 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 10,
   "id": "00d1b249",
   "metadata": {},
   "outputs": [
    {
-     "ename": "ImportError",
+     "name": "stdout",
-     "evalue": "cannot import name 'Constant' from 'constants' (/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/constants.py)",
+     "output_type": "stream",
-     "output_type": "error",
+     "text": [
-     "traceback": [
+      "The autoreload extension is already loaded. To reload it, use:\n",
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "  %reload_ext autoreload\n"
-      "\u001b[0;31mImportError\u001b[0m                               Traceback (most recent call last)",
-      "Cell \u001b[0;32mIn[1], line 14\u001b[0m\n\u001b[1;32m     10\u001b[0m \u001b[38;5;28;01mimport\u001b[39;00m \u001b[38;5;21;01mpandas\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m \u001b[38;5;21;01mpd\u001b[39;00m\n\u001b[1;32m     11\u001b[0m \u001b[38;5;66;03m# -- add new imports here --\u001b[39;00m\n\u001b[1;32m     12\u001b[0m \n\u001b[1;32m     13\u001b[0m \u001b[38;5;66;03m# local imports\u001b[39;00m\n\u001b[0;32m---> 14\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mconstants\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m Constant \u001b[38;5;28;01mas\u001b[39;00m C\n\u001b[1;32m     15\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mloaders\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m load_ratings,load_items \n\u001b[1;32m     16\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01msurprise\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m KNNWithMeans, accuracy, AlgoBase, PredictionImpossible\n",
-      "\u001b[0;31mImportError\u001b[0m: cannot import name 'Constant' from 'constants' (/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/constants.py)"
     ]
    }
   ],
@@ -59,7 +56,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 11,
   "id": "aafd1712",
   "metadata": {},
   "outputs": [
@@ -69,59 +66,18 @@
     "text": [
      "Computing the msd similarity matrix...\n",
      "Done computing similarity matrix.\n",
-      "user: 11         item: 364        r_ui = 4.00   est = 3.42   {'was_impossible': True, 'reason': 'User and/or item is unknown.'}\n"
+      "user: 11         item: 364        r_ui = None   est = 2.49   {'actual_k': 2, 'was_impossible': False}\n"
     ]
    }
   ],
   "source": [
-    "\n",
    "# Create Surprise Dataset from the pandas DataFrame and Reader\n",
    "surprise_data = load_ratings(surprise_format=True)\n",
    "\n",
    "trainset = surprise_data.build_full_trainset()\n",
    "\n",
    "\n",
-    "testset = trainset.build_anti_testset()\n",
+    "testset = trainset.build_anti_testset()\n"
-    "\n",
-    "\n",
-    "sim_options = {\n",
-    "    'name': 'msd',  # Mean Squared Difference (Mean Square Error)\n",
-    "    'user_based': True,  # User-based collaborative filtering\n",
-    "    'min_support': 3  # Minimum number of common ratings required\n",
-    "}\n",
-    "\n",
-    "\n",
-    "# Build an algorithm, and train it.\n",
-    "algo = KNNWithMeans(sim_options=sim_options, k=3, min_k=2)\n",
-    "algo.fit(trainset)\n",
-    "algo.test(testset)\n",
-    "\n",
-    "\n",
-    "uid = str(11)  # raw user id (as in the ratings file). They are **strings**!\n",
-    "iid = str(364) \n",
-    "\n",
-    "pred = algo.predict(uid, iid, r_ui=4, verbose=True)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "cf3ccdc0",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# -- load data, build trainset and anti testset --\n",
-    "# it depends on the tiny dataset\n",
-    "surprise_data = load_ratings(surprise_format=True)\n",
-    "df_movies = load_items()\n",
-    "\n",
-    "# Assuming you have a pandas DataFrame named 'df' with columns ['user_id', 'item_id', 'rating']\n",
-    "\n",
-    "# Build train set with all available ratings\n",
-    "trainset = surprise_data.build_full_trainset()\n",
-    "\n",
-    "# Build anti-test set\n",
-    "testset = trainset.build_anti_testset()"
   ]
  },
  {
@@ -136,43 +92,34 @@
  {
   "cell_type": "code",
   "execution_count": null,
-   "id": "e6fb78b7",
+   "id": "ce078b43",
   "metadata": {},
-   "outputs": [
+   "outputs": [],
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Computing the msd similarity matrix...\n",
-      "Done computing similarity matrix.\n",
-      "3.4190898791540785\n"
-     ]
-    }
-   ],
   "source": [
-    "# -- using surprise's user-based algorithm, explore the impact of different parameters and displays predictions --\n",
+    "# User-based prediction for user 11 and item 364\n",
    "\n",
-    "# Define the similarity options\n",
    "sim_options = {\n",
    "    'name': 'msd',  # Mean Squared Difference (Mean Square Error)\n",
    "    'user_based': True,  # User-based collaborative filtering\n",
    "    'min_support': 3  # Minimum number of common ratings required\n",
    "}\n",
    "\n",
-    "# Create an instance of KNNWithMeans with the specified options\n",
-    "knn_model = KNNWithMeans(k=3, min_k=2, sim_options=sim_options)\n",
    "\n",
-    "# Train the algorithm on the trainset\n",
+    "# Build an algorithm, and train it.\n",
-    "knn_model.fit(trainset).test(testset)\n",
+    "algo = KNNWithMeans(sim_options=sim_options, k=3, min_k=2)\n",
+    "algo.fit(trainset)\n",
+    "algo.test(testset)\n",
+    "\n",
+    "\n",
+    "uid = 11  # raw user id (as in the ratings file); an int here - the str form was reported as an unknown user/item\n",
+    "iid = 364 \n",
    "\n",
-    "# Make an estimation for user 11 and item 364\n",
+    "pred = algo.predict(uid, iid, verbose=True)"
-    "prediction = knn_model.predict('11', '364')\n",
-    "print(prediction.est)"
   ]
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 13,
   "id": "ffe89c56",
   "metadata": {},
   "outputs": [
@@ -183,102 +130,102 @@
      "Computing the msd similarity matrix...\n",
      "Done computing similarity matrix.\n",
      "Predictions with min_k = 1:\n",
-      "User: 15, Item: 942, Rating: 3.7769516356699464\n",
+      "User: 11, Item: 1214, Rating: 3.6041666666666665\n",
-      "User: 15, Item: 2117, Rating: 2.9340004894942537\n",
+      "User: 11, Item: 364, Rating: 2.49203431372549\n",
-      "User: 15, Item: 2672, Rating: 2.371008709611413\n",
+      "User: 11, Item: 4308, Rating: 1.6041666666666667\n",
-      "User: 15, Item: 5054, Rating: 3.010328638497653\n",
+      "User: 11, Item: 527, Rating: 3.898897058823529\n",
-      "User: 15, Item: 6322, Rating: 1.711175832857413\n",
+      "User: 13, Item: 1997, Rating: 2.8\n",
-      "User: 15, Item: 6323, Rating: 1.7645762379992287\n",
+      "User: 13, Item: 4993, Rating: 3.2375\n",
-      "User: 15, Item: 6757, Rating: 3.010328638497653\n",
+      "User: 13, Item: 2700, Rating: 2.8\n",
-      "User: 15, Item: 7700, Rating: 3.561484741491386\n",
+      "User: 13, Item: 1721, Rating: 1.2374999999999998\n",
-      "User: 15, Item: 7981, Rating: 3.386000174210522\n",
+      "User: 13, Item: 527, Rating: 3.2375\n",
-      "User: 15, Item: 8600, Rating: 3.320743223639117\n",
+      "User: 17, Item: 2028, Rating: 3.8125\n",
-      "User: 15, Item: 8620, Rating: 2.7538763809343654\n",
+      "User: 17, Item: 4993, Rating: 4.128289473684211\n",
-      "User: 15, Item: 31952, Rating: 3.7409900837647396\n",
+      "User: 17, Item: 1214, Rating: 3.6875\n",
-      "User: 15, Item: 3, Rating: 2.222062601579949\n",
+      "User: 17, Item: 4308, Rating: 1.6875\n",
-      "User: 15, Item: 64, Rating: 0.9224387353614938\n",
+      "User: 19, Item: 1997, Rating: 3.5\n",
-      "User: 15, Item: 206, Rating: 2.35668733389394\n",
+      "User: 19, Item: 2028, Rating: 3.5\n",
-      "User: 15, Item: 249, Rating: 3.1290259851652826\n",
+      "User: 19, Item: 4993, Rating: 3.5\n",
-      "User: 15, Item: 276, Rating: 2.1800017354806753\n",
+      "User: 19, Item: 5952, Rating: 3.5\n",
-      "User: 15, Item: 369, Rating: 2.3082373858282694\n",
+      "User: 19, Item: 2700, Rating: 3.5\n",
-      "User: 15, Item: 504, Rating: 2.2600496220227573\n",
+      "User: 19, Item: 1721, Rating: 3.5\n",
-      "User: 15, Item: 515, Rating: 3.6575674086958188\n",
+      "User: 19, Item: 1214, Rating: 3.5\n",
-      "User: 15, Item: 522, Rating: 2.4562020809509626\n",
+      "User: 19, Item: 364, Rating: 3.5\n",
-      "User: 15, Item: 580, Rating: 1.9073310817298395\n",
+      "User: 23, Item: 1997, Rating: 2.782649253731343\n",
-      "User: 15, Item: 599, Rating: 2.780847470837928\n",
+      "User: 23, Item: 2700, Rating: 2.349813432835821\n",
-      "User: 15, Item: 915, Rating: 2.761094249104645\n",
+      "User: 27, Item: 1997, Rating: 4.666666666666667\n",
-      "User: 15, Item: 966, Rating: 3.0894953051643195\n",
+      "User: 27, Item: 2028, Rating: 5.0\n",
-      "User: 15, Item: 1274, Rating: 2.9873500196382845\n",
+      "User: 27, Item: 5952, Rating: 5.0\n",
-      "User: 15, Item: 1299, Rating: 3.0779327239728005\n",
+      "User: 27, Item: 2700, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1345, Rating: 2.2037629856623138\n",
+      "User: 27, Item: 1721, Rating: 3.104166666666667\n",
-      "User: 15, Item: 1354, Rating: 2.001877412379849\n",
+      "User: 27, Item: 364, Rating: 4.604166666666667\n",
-      "User: 15, Item: 532, Rating: 2.7123071345260277\n",
+      "User: 27, Item: 4308, Rating: 3.104166666666667\n",
      "Computing the msd similarity matrix...\n",
      "Done computing similarity matrix.\n",
      "Predictions with min_k = 2:\n",
-      "User: 15, Item: 942, Rating: 3.7769516356699464\n",
+      "User: 11, Item: 1214, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 2117, Rating: 2.9340004894942537\n",
+      "User: 11, Item: 364, Rating: 2.49203431372549\n",
-      "User: 15, Item: 2672, Rating: 2.371008709611413\n",
+      "User: 11, Item: 4308, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 5054, Rating: 2.693661971830986\n",
+      "User: 11, Item: 527, Rating: 3.898897058823529\n",
-      "User: 15, Item: 6322, Rating: 1.711175832857413\n",
+      "User: 13, Item: 1997, Rating: 2.8\n",
-      "User: 15, Item: 6323, Rating: 1.7645762379992287\n",
+      "User: 13, Item: 4993, Rating: 2.8\n",
-      "User: 15, Item: 6757, Rating: 2.693661971830986\n",
+      "User: 13, Item: 2700, Rating: 2.8\n",
-      "User: 15, Item: 7700, Rating: 3.561484741491386\n",
+      "User: 13, Item: 1721, Rating: 2.8\n",
-      "User: 15, Item: 7981, Rating: 3.386000174210522\n",
+      "User: 13, Item: 527, Rating: 2.8\n",
-      "User: 15, Item: 8600, Rating: 3.320743223639117\n",
+      "User: 17, Item: 2028, Rating: 3.8125\n",
-      "User: 15, Item: 8620, Rating: 2.7538763809343654\n",
+      "User: 17, Item: 4993, Rating: 4.128289473684211\n",
-      "User: 15, Item: 31952, Rating: 3.7409900837647396\n",
+      "User: 17, Item: 1214, Rating: 3.25\n",
-      "User: 15, Item: 3, Rating: 2.222062601579949\n",
+      "User: 17, Item: 4308, Rating: 3.25\n",
-      "User: 15, Item: 64, Rating: 0.9224387353614938\n",
+      "User: 19, Item: 1997, Rating: 3.5\n",
-      "User: 15, Item: 206, Rating: 2.35668733389394\n",
+      "User: 19, Item: 2028, Rating: 3.5\n",
-      "User: 15, Item: 249, Rating: 3.1290259851652826\n",
+      "User: 19, Item: 4993, Rating: 3.5\n",
-      "User: 15, Item: 276, Rating: 2.1800017354806753\n",
+      "User: 19, Item: 5952, Rating: 3.5\n",
-      "User: 15, Item: 369, Rating: 2.3082373858282694\n",
+      "User: 19, Item: 2700, Rating: 3.5\n",
-      "User: 15, Item: 504, Rating: 2.2600496220227573\n",
+      "User: 19, Item: 1721, Rating: 3.5\n",
-      "User: 15, Item: 515, Rating: 3.6575674086958188\n",
+      "User: 19, Item: 1214, Rating: 3.5\n",
-      "User: 15, Item: 522, Rating: 2.4562020809509626\n",
+      "User: 19, Item: 364, Rating: 3.5\n",
-      "User: 15, Item: 580, Rating: 1.9073310817298395\n",
+      "User: 23, Item: 1997, Rating: 2.782649253731343\n",
-      "User: 15, Item: 599, Rating: 2.780847470837928\n",
+      "User: 23, Item: 2700, Rating: 2.349813432835821\n",
-      "User: 15, Item: 915, Rating: 2.761094249104645\n",
+      "User: 27, Item: 1997, Rating: 4.666666666666667\n",
-      "User: 15, Item: 966, Rating: 2.693661971830986\n",
+      "User: 27, Item: 2028, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1274, Rating: 2.9873500196382845\n",
+      "User: 27, Item: 5952, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1299, Rating: 3.0779327239728005\n",
+      "User: 27, Item: 2700, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1345, Rating: 2.2037629856623138\n",
+      "User: 27, Item: 1721, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1354, Rating: 2.001877412379849\n",
+      "User: 27, Item: 364, Rating: 4.666666666666667\n",
-      "User: 15, Item: 532, Rating: 2.7123071345260277\n",
+      "User: 27, Item: 4308, Rating: 4.666666666666667\n",
      "Computing the msd similarity matrix...\n",
      "Done computing similarity matrix.\n",
      "Predictions with min_k = 3:\n",
-      "User: 15, Item: 942, Rating: 3.7769516356699464\n",
+      "User: 11, Item: 1214, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 2117, Rating: 2.9340004894942537\n",
+      "User: 11, Item: 364, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 2672, Rating: 2.371008709611413\n",
+      "User: 11, Item: 4308, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 5054, Rating: 2.693661971830986\n",
+      "User: 11, Item: 527, Rating: 3.1666666666666665\n",
-      "User: 15, Item: 6322, Rating: 2.693661971830986\n",
+      "User: 13, Item: 1997, Rating: 2.8\n",
-      "User: 15, Item: 6323, Rating: 1.7645762379992287\n",
+      "User: 13, Item: 4993, Rating: 2.8\n",
-      "User: 15, Item: 6757, Rating: 2.693661971830986\n",
+      "User: 13, Item: 2700, Rating: 2.8\n",
-      "User: 15, Item: 7700, Rating: 2.693661971830986\n",
+      "User: 13, Item: 1721, Rating: 2.8\n",
-      "User: 15, Item: 7981, Rating: 3.386000174210522\n",
+      "User: 13, Item: 527, Rating: 2.8\n",
-      "User: 15, Item: 8600, Rating: 2.693661971830986\n",
+      "User: 17, Item: 2028, Rating: 3.25\n",
-      "User: 15, Item: 8620, Rating: 2.7538763809343654\n",
+      "User: 17, Item: 4993, Rating: 3.25\n",
-      "User: 15, Item: 31952, Rating: 2.693661971830986\n",
+      "User: 17, Item: 1214, Rating: 3.25\n",
-      "User: 15, Item: 3, Rating: 2.222062601579949\n",
+      "User: 17, Item: 4308, Rating: 3.25\n",
-      "User: 15, Item: 64, Rating: 0.9224387353614938\n",
+      "User: 19, Item: 1997, Rating: 3.5\n",
-      "User: 15, Item: 206, Rating: 2.35668733389394\n",
+      "User: 19, Item: 2028, Rating: 3.5\n",
-      "User: 15, Item: 249, Rating: 3.1290259851652826\n",
+      "User: 19, Item: 4993, Rating: 3.5\n",
-      "User: 15, Item: 276, Rating: 2.1800017354806753\n",
+      "User: 19, Item: 5952, Rating: 3.5\n",
-      "User: 15, Item: 369, Rating: 2.3082373858282694\n",
+      "User: 19, Item: 2700, Rating: 3.5\n",
-      "User: 15, Item: 504, Rating: 2.2600496220227573\n",
+      "User: 19, Item: 1721, Rating: 3.5\n",
-      "User: 15, Item: 515, Rating: 3.6575674086958188\n",
+      "User: 19, Item: 1214, Rating: 3.5\n",
-      "User: 15, Item: 522, Rating: 2.4562020809509626\n",
+      "User: 19, Item: 364, Rating: 3.5\n",
-      "User: 15, Item: 580, Rating: 1.9073310817298395\n",
+      "User: 23, Item: 1997, Rating: 2.5625\n",
-      "User: 15, Item: 599, Rating: 2.780847470837928\n",
+      "User: 23, Item: 2700, Rating: 2.5625\n",
-      "User: 15, Item: 915, Rating: 2.761094249104645\n",
+      "User: 27, Item: 1997, Rating: 4.666666666666667\n",
-      "User: 15, Item: 966, Rating: 2.693661971830986\n",
+      "User: 27, Item: 2028, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1274, Rating: 2.9873500196382845\n",
+      "User: 27, Item: 5952, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1299, Rating: 3.0779327239728005\n",
+      "User: 27, Item: 2700, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1345, Rating: 2.2037629856623138\n",
+      "User: 27, Item: 1721, Rating: 4.666666666666667\n",
-      "User: 15, Item: 1354, Rating: 2.001877412379849\n",
+      "User: 27, Item: 364, Rating: 4.666666666666667\n",
-      "User: 15, Item: 532, Rating: 2.7123071345260277\n"
+      "User: 27, Item: 4308, Rating: 4.666666666666667\n"
     ]
    }
   ],
@@ -333,7 +280,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 14,
   "id": "cc806424",
   "metadata": {},
   "outputs": [
@@ -343,109 +290,108 @@
     "text": [
      "\n",
      "Prédictions avec min_support = 1:\n",
-      "User: 15, Item: 942, Actual_k: 3\n",
+      "User: 11, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 2117, Actual_k: 3\n",
+      "User: 11, Item: 364, Actual_k: 2\n",
-      "User: 15, Item: 2672, Actual_k: 3\n",
+      "User: 11, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 5054, Actual_k: 1\n",
+      "User: 11, Item: 527, Actual_k: 2\n",
-      "User: 15, Item: 6322, Actual_k: 2\n",
+      "User: 13, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 6323, Actual_k: 3\n",
+      "User: 13, Item: 4993, Actual_k: 1\n",
-      "User: 15, Item: 6757, Actual_k: 1\n",
+      "User: 13, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 7700, Actual_k: 2\n",
+      "User: 13, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 7981, Actual_k: 3\n",
+      "User: 13, Item: 527, Actual_k: 1\n",
-      "User: 15, Item: 8600, Actual_k: 2\n",
+      "User: 17, Item: 2028, Actual_k: 2\n",
-      "User: 15, Item: 8620, Actual_k: 3\n",
+      "User: 17, Item: 4993, Actual_k: 2\n",
-      "User: 15, Item: 31952, Actual_k: 2\n",
+      "User: 17, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 3, Actual_k: 3\n",
+      "User: 17, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 64, Actual_k: 3\n",
+      "User: 19, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 206, Actual_k: 3\n",
+      "User: 19, Item: 2028, Actual_k: 0\n",
-      "User: 15, Item: 249, Actual_k: 3\n",
+      "User: 19, Item: 4993, Actual_k: 0\n",
-      "User: 15, Item: 276, Actual_k: 3\n",
+      "User: 19, Item: 5952, Actual_k: 0\n",
-      "User: 15, Item: 369, Actual_k: 3\n",
+      "User: 19, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 504, Actual_k: 3\n",
+      "User: 19, Item: 1721, Actual_k: 0\n",
-      "User: 15, Item: 515, Actual_k: 3\n",
+      "User: 19, Item: 1214, Actual_k: 0\n",
-      "User: 15, Item: 522, Actual_k: 3\n",
+      "User: 19, Item: 364, Actual_k: 0\n",
-      "User: 15, Item: 580, Actual_k: 3\n",
+      "User: 23, Item: 1997, Actual_k: 2\n",
-      "User: 15, Item: 599, Actual_k: 3\n",
+      "User: 23, Item: 2700, Actual_k: 2\n",
-      "User: 15, Item: 915, Actual_k: 3\n",
+      "User: 27, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 966, Actual_k: 1\n",
+      "User: 27, Item: 2028, Actual_k: 1\n",
-      "User: 15, Item: 1274, Actual_k: 3\n",
+      "User: 27, Item: 5952, Actual_k: 1\n",
-      "User: 15, Item: 1299, Actual_k: 3\n",
+      "User: 27, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 1345, Actual_k: 3\n",
+      "User: 27, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 1354, Actual_k: 3\n",
+      "User: 27, Item: 364, Actual_k: 1\n",
-      "User: 15, Item: 532, Actual_k: 3\n",
+      "User: 27, Item: 4308, Actual_k: 1\n",
      "\n",
      "Prédictions avec min_support = 2:\n",
-      "User: 15, Item: 942, Actual_k: 3\n",
+      "User: 11, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 2117, Actual_k: 3\n",
+      "User: 11, Item: 364, Actual_k: 2\n",
-      "User: 15, Item: 2672, Actual_k: 3\n",
+      "User: 11, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 5054, Actual_k: 1\n",
+      "User: 11, Item: 527, Actual_k: 2\n",
-      "User: 15, Item: 6322, Actual_k: 2\n",
+      "User: 13, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 6323, Actual_k: 3\n",
+      "User: 13, Item: 4993, Actual_k: 1\n",
-      "User: 15, Item: 6757, Actual_k: 1\n",
+      "User: 13, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 7700, Actual_k: 2\n",
+      "User: 13, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 7981, Actual_k: 3\n",
+      "User: 13, Item: 527, Actual_k: 1\n",
-      "User: 15, Item: 8600, Actual_k: 2\n",
+      "User: 17, Item: 2028, Actual_k: 2\n",
-      "User: 15, Item: 8620, Actual_k: 3\n",
+      "User: 17, Item: 4993, Actual_k: 2\n",
-      "User: 15, Item: 31952, Actual_k: 2\n",
+      "User: 17, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 3, Actual_k: 3\n",
+      "User: 17, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 64, Actual_k: 3\n",
+      "User: 19, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 206, Actual_k: 3\n",
+      "User: 19, Item: 2028, Actual_k: 0\n",
-      "User: 15, Item: 249, Actual_k: 3\n",
+      "User: 19, Item: 4993, Actual_k: 0\n",
-      "User: 15, Item: 276, Actual_k: 3\n",
+      "User: 19, Item: 5952, Actual_k: 0\n",
-      "User: 15, Item: 369, Actual_k: 3\n",
+      "User: 19, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 504, Actual_k: 3\n",
+      "User: 19, Item: 1721, Actual_k: 0\n",
-      "User: 15, Item: 515, Actual_k: 3\n",
+      "User: 19, Item: 1214, Actual_k: 0\n",
-      "User: 15, Item: 522, Actual_k: 3\n",
+      "User: 19, Item: 364, Actual_k: 0\n",
-      "User: 15, Item: 580, Actual_k: 3\n",
+      "User: 23, Item: 1997, Actual_k: 2\n",
-      "User: 15, Item: 599, Actual_k: 3\n",
+      "User: 23, Item: 2700, Actual_k: 2\n",
-      "User: 15, Item: 915, Actual_k: 3\n",
+      "User: 27, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 966, Actual_k: 1\n",
+      "User: 27, Item: 2028, Actual_k: 1\n",
-      "User: 15, Item: 1274, Actual_k: 3\n",
+      "User: 27, Item: 5952, Actual_k: 1\n",
-      "User: 15, Item: 1299, Actual_k: 3\n",
+      "User: 27, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 1345, Actual_k: 3\n",
+      "User: 27, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 1354, Actual_k: 3\n",
+      "User: 27, Item: 364, Actual_k: 1\n",
-      "User: 15, Item: 532, Actual_k: 3\n",
+      "User: 27, Item: 4308, Actual_k: 1\n",
      "\n",
      "Prédictions avec min_support = 3:\n",
-      "User: 15, Item: 942, Actual_k: 3\n",
+      "User: 11, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 2117, Actual_k: 3\n",
+      "User: 11, Item: 364, Actual_k: 2\n",
-      "User: 15, Item: 2672, Actual_k: 3\n",
+      "User: 11, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 5054, Actual_k: 1\n",
+      "User: 11, Item: 527, Actual_k: 2\n",
-      "User: 15, Item: 6322, Actual_k: 2\n",
+      "User: 13, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 6323, Actual_k: 3\n",
+      "User: 13, Item: 4993, Actual_k: 1\n",
-      "User: 15, Item: 6757, Actual_k: 1\n",
+      "User: 13, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 7700, Actual_k: 2\n",
+      "User: 13, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 7981, Actual_k: 3\n",
+      "User: 13, Item: 527, Actual_k: 1\n",
-      "User: 15, Item: 8600, Actual_k: 2\n",
+      "User: 17, Item: 2028, Actual_k: 2\n",
-      "User: 15, Item: 8620, Actual_k: 3\n",
+      "User: 17, Item: 4993, Actual_k: 2\n",
-      "User: 15, Item: 31952, Actual_k: 2\n",
+      "User: 17, Item: 1214, Actual_k: 1\n",
-      "User: 15, Item: 3, Actual_k: 3\n",
+      "User: 17, Item: 4308, Actual_k: 1\n",
-      "User: 15, Item: 64, Actual_k: 3\n",
+      "User: 19, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 206, Actual_k: 3\n",
+      "User: 19, Item: 2028, Actual_k: 0\n",
-      "User: 15, Item: 249, Actual_k: 3\n",
+      "User: 19, Item: 4993, Actual_k: 0\n",
-      "User: 15, Item: 276, Actual_k: 3\n",
+      "User: 19, Item: 5952, Actual_k: 0\n",
-      "User: 15, Item: 369, Actual_k: 3\n",
+      "User: 19, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 504, Actual_k: 3\n",
+      "User: 19, Item: 1721, Actual_k: 0\n",
-      "User: 15, Item: 515, Actual_k: 3\n",
+      "User: 19, Item: 1214, Actual_k: 0\n",
-      "User: 15, Item: 522, Actual_k: 3\n",
+      "User: 19, Item: 364, Actual_k: 0\n",
-      "User: 15, Item: 580, Actual_k: 3\n",
+      "User: 23, Item: 1997, Actual_k: 2\n",
-      "User: 15, Item: 599, Actual_k: 3\n",
+      "User: 23, Item: 2700, Actual_k: 2\n",
-      "User: 15, Item: 915, Actual_k: 3\n",
+      "User: 27, Item: 1997, Actual_k: 0\n",
-      "User: 15, Item: 966, Actual_k: 1\n",
+      "User: 27, Item: 2028, Actual_k: 1\n",
-      "User: 15, Item: 1274, Actual_k: 3\n",
+      "User: 27, Item: 5952, Actual_k: 1\n",
-      "User: 15, Item: 1299, Actual_k: 3\n",
+      "User: 27, Item: 2700, Actual_k: 0\n",
-      "User: 15, Item: 1345, Actual_k: 3\n",
+      "User: 27, Item: 1721, Actual_k: 1\n",
-      "User: 15, Item: 1354, Actual_k: 3\n",
+      "User: 27, Item: 364, Actual_k: 1\n",
-      "User: 15, Item: 532, Actual_k: 3\n",
+      "User: 27, Item: 4308, Actual_k: 1\n",
      "\n",
      "Matrice de similarité:\n",
-      "[[1.         0.39130435 0.35942029 ... 0.24358974 0.28513238 0.21451104]\n",
+      "[[1.         0.         0.24615385 0.         0.43243243 0.        ]\n",
-      " [0.39130435 1.         0.32786885 ... 0.30967742 0.42424242 0.21621622]\n",
+      " [0.         1.         0.         0.         0.17094017 0.        ]\n",
-      " [0.35942029 0.32786885 1.         ... 0.36666667 0.72727273 0.34375   ]\n",
+      " [0.24615385 0.         1.         0.         0.53333333 0.        ]\n",
-      " ...\n",
+      " [0.         0.         0.         1.         0.         0.        ]\n",
-      " [0.24358974 0.30967742 0.36666667 ... 1.         0.6779661  0.37569061]\n",
+      " [0.43243243 0.17094017 0.53333333 0.         1.         0.25      ]\n",
-      " [0.28513238 0.42424242 0.72727273 ... 0.6779661  1.         0.83333333]\n",
+      " [0.         0.         0.         0.         0.25       1.        ]]\n",
-      " [0.21451104 0.21621622 0.34375    ... 0.37569061 0.83333333 1.        ]]\n",
      "None\n"
     ]
    }
@@ -485,7 +431,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
   "id": "d03ed9eb",
   "metadata": {},
   "outputs": [
@@ -493,13 +439,12 @@
     "name": "stdout",
     "output_type": "stream",
     "text": [
-      "[[3.  1.5 4.  ... nan nan nan]\n",
+      "[[1.5 4.  5.  4.5 3.  1.  nan nan nan nan]\n",
-      " [nan nan nan ... nan nan nan]\n",
+      " [nan 2.  nan 2.  nan nan 1.  5.  4.  nan]\n",
-      " [4.  3.  3.  ... nan nan nan]\n",
+      " [5.  nan nan 4.5 3.  1.  nan 1.5 nan 4.5]\n",
-      " ...\n",
+      " [nan nan nan nan nan nan nan nan 2.  5. ]\n",
-      " [4.5 nan nan ... nan nan nan]\n",
+      " [nan 3.  3.  4.  nan 1.  3.  2.5 1.  3. ]\n",
-      " [nan nan nan ... nan nan nan]\n",
+      " [nan nan 5.  nan nan nan 4.  nan nan 5. ]]\n"
-      " [2.  nan nan ... nan nan nan]]\n"
     ]
    }
   ],
@@ -629,7 +574,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 16,
   "id": "be53ae27",
   "metadata": {},
   "outputs": [
@@ -637,10 +582,10 @@
     "name": "stdout",
     "output_type": "stream",
     "text": [
-      "UserBased MAE: 1.5398252671298895\n",
+      "UserBased MAE: 1.7175000000000002\n",
-      "UserBased RMSE: 1.5553141029705104\n",
+      "UserBased RMSE: 1.7384170241918369\n",
-      "KNNWithMeans MAE: 0.5419110316300769\n",
+      "KNNWithMeans MAE: 0.661617428851614\n",
-      "KNNWithMeans RMSE: 0.7019543155680094\n"
+      "KNNWithMeans RMSE: 0.8426896111887758\n"
     ]
    }
   ],
@@ -686,7 +631,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 17,
   "id": "c20d8e19",
   "metadata": {},
   "outputs": [
@@ -698,10 +643,10 @@
      "Done computing similarity matrix.\n",
      "Computing the cosine similarity matrix...\n",
      "Done computing similarity matrix.\n",
-      "RMSE: 0.9799\n",
+      "RMSE: 1.0812\n",
-      "RMSE: 0.9871\n",
+      "RMSE: 1.0910\n",
-      "RMSE with MSD similarity: 0.9798533097556152\n",
+      "RMSE with MSD similarity: 1.0811758629789194\n",
-      "RMSE with Jaccard similarity: 0.9870653791755158\n"
+      "RMSE with Jaccard similarity: 1.0910225374454734\n"
     ]
    }
   ],

 %% Cell type:markdown id:f4a8f664 tags:
 # Custom User-based Model
 This notebook aims at creating a UserBased class that inherits from the AlgoBase class (surprise package) and that can be customized with various similarity metrics, peer groups and score aggregation functions.
 %% Cell type:code id:00d1b249 tags:
 ``` python
 # reloads modules automatically before entering the execution of code
 %load_ext autoreload
 %autoreload 2
 # standard library imports
 # -- add new imports here --
 # third parties imports
 import numpy as np
 import pandas as pd
 # -- add new imports here --
 # local imports
 from constants import Constant as C
 from loaders import load_ratings,load_items
 from surprise import KNNWithMeans, accuracy, AlgoBase, PredictionImpossible
 import heapq
 ```
 %% Output
-    ---------------------------------------------------------------------------
+    The autoreload extension is already loaded. To reload it, use:
-    ImportError                               Traceback (most recent call last)
+      %reload_ext autoreload
-Cell     In[1], line 14
-         10 import pandas as pd
-         11 # -- add new imports here --
-         12
-         13 # local imports
-    ---> 14 from constants import Constant as C
-         15 from loaders import load_ratings,load_items
-         16 from surprise import KNNWithMeans, accuracy, AlgoBase, PredictionImpossible
-    ImportError: cannot import name 'Constant' from 'constants' (/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/constants.py)
 %% Cell type:markdown id:22716aa3 tags:
 # 1. Loading Data
 Prepare a dataset in order to help implementing a user-based recommender system
 %% Cell type:code id:aafd1712 tags:
 ``` python
 # Create Surprise Dataset from the pandas DataFrame and Reader
 surprise_data = load_ratings(surprise_format=True)
 trainset = surprise_data.build_full_trainset()
 testset = trainset.build_anti_testset()
-sim_options = {
-    'name': 'msd',  # Mean Squared Difference (Mean Square Error)
-    'user_based': True,  # User-based collaborative filtering
-    'min_support': 3  # Minimum number of common ratings required
-}
-# Build an algorithm, and train it.
-algo = KNNWithMeans(sim_options=sim_options, k=3, min_k=2)
-algo.fit(trainset)
-algo.test(testset)
-uid = str(11)  # raw user id (as in the ratings file). They are **strings**!
-iid = str(364)
-pred = algo.predict(uid, iid, r_ui=4, verbose=True)
 ```
 %% Output
    Computing the msd similarity matrix...
    Done computing similarity matrix.
-    user: 11         item: 364        r_ui = 4.00   est = 3.42   {'was_impossible': True, 'reason': 'User and/or item is unknown.'}
+    user: 11         item: 364        r_ui = None   est = 2.49   {'actual_k': 2, 'was_impossible': False}
-%% Cell type:code id:cf3ccdc0 tags:
-``` python
-# -- load data, build trainset and anti testset --
-# it depends on the tiny dataset
-surprise_data = load_ratings(surprise_format=True)
-df_movies = load_items()
-# Assuming you have a pandas DataFrame named 'df' with columns ['user_id', 'item_id', 'rating']
-# Build train set with all available ratings
-trainset = surprise_data.build_full_trainset()
-# Build anti-test set
-testset = trainset.build_anti_testset()
-```
 %% Cell type:markdown id:94adf3a6 tags:
 # 2. Explore Surprise's user-based algorithm
 Displays user-based predictions and similarity matrix on the test dataset using the KNNWithMeans class
-%% Cell type:code id:e6fb78b7 tags:
+%% Cell type:code id:ce078b43 tags:
 ``` python
-# -- using surprise's user-based algorithm, explore the impact of different parameters and displays predictions --
+#User-based prediction for the user 11 and the item 364
-# Define the similarity options
 sim_options = {
    'name': 'msd',  # Mean Squared Difference (Mean Square Error)
    'user_based': True,  # User-based collaborative filtering
    'min_support': 3  # Minimum number of common ratings required
 }
-# Create an instance of KNNWithMeans with the specified options
-knn_model = KNNWithMeans(k=3, min_k=2, sim_options=sim_options)
-# Train the algorithm on the trainset
+# Build an algorithm, and train it.
-knn_model.fit(trainset).test(testset)
+algo = KNNWithMeans(sim_options=sim_options, k=3, min_k=2)
+algo.fit(trainset)
+algo.test(testset)
-# Make an estimation for user 11 and item 364
-prediction = knn_model.predict('11', '364')
-print(prediction.est)
-```
-%% Output
+uid = 11  # raw user id (as in the ratings file). They are **strings**!
+iid = 364
-    Computing the msd similarity matrix...
+pred = algo.predict(uid, iid, verbose=True)
-    Done computing similarity matrix.
+```
-    3.4190898791540785
 %% Cell type:code id:ffe89c56 tags:
 ``` python
 # Playing with KNN
 # Define the similarity options used by the models built in predict_ratings below
 sim_options = {
    'name': 'msd',  # Mean Squared Difference similarity
    'user_based': True,  # User-based collaborative filtering
    'min_support': 3  # Minimum number of common ratings required
 }
 # Create an instance of KNNWithMeans with the specified options
 def predict_ratings(trainset, testset, min_k_values):
    """Train one KNNWithMeans model per ``min_k`` value and print its first 30 predictions.

    Every model is built with ``k=3`` and the notebook-level ``sim_options``.
    Nothing is returned; the predictions are only printed.
    """
    for min_k in min_k_values:
        # Fit on the trainset, then predict every (user, item) pair of the testset
        model = KNNWithMeans(sim_options=sim_options, k=3, min_k=min_k)
        model.fit(trainset)
        all_predictions = model.test(testset)
        print(f"Predictions with min_k = {min_k}:")
        # Only the first 30 predictions are displayed
        displayed = all_predictions[:30]
        for prediction in displayed:
            print(f"User: {prediction.uid}, Item: {prediction.iid}, Rating: {prediction.est}")
 # Assuming trainset and testset are already defined
 predict_ratings(trainset, testset, min_k_values=[1, 2, 3])
 ```
 %% Output
    Computing the msd similarity matrix...
    Done computing similarity matrix.
    Predictions with min_k = 1:
-    User: 15, Item: 942, Rating: 3.7769516356699464
+    User: 11, Item: 1214, Rating: 3.6041666666666665
-    User: 15, Item: 2117, Rating: 2.9340004894942537
+    User: 11, Item: 364, Rating: 2.49203431372549
-    User: 15, Item: 2672, Rating: 2.371008709611413
+    User: 11, Item: 4308, Rating: 1.6041666666666667
-    User: 15, Item: 5054, Rating: 3.010328638497653
+    User: 11, Item: 527, Rating: 3.898897058823529
-    User: 15, Item: 6322, Rating: 1.711175832857413
+    User: 13, Item: 1997, Rating: 2.8
-    User: 15, Item: 6323, Rating: 1.7645762379992287
+    User: 13, Item: 4993, Rating: 3.2375
-    User: 15, Item: 6757, Rating: 3.010328638497653
+    User: 13, Item: 2700, Rating: 2.8
-    User: 15, Item: 7700, Rating: 3.561484741491386
+    User: 13, Item: 1721, Rating: 1.2374999999999998
-    User: 15, Item: 7981, Rating: 3.386000174210522
+    User: 13, Item: 527, Rating: 3.2375
-    User: 15, Item: 8600, Rating: 3.320743223639117
+    User: 17, Item: 2028, Rating: 3.8125
-    User: 15, Item: 8620, Rating: 2.7538763809343654
+    User: 17, Item: 4993, Rating: 4.128289473684211
-    User: 15, Item: 31952, Rating: 3.7409900837647396
+    User: 17, Item: 1214, Rating: 3.6875
-    User: 15, Item: 3, Rating: 2.222062601579949
+    User: 17, Item: 4308, Rating: 1.6875
-    User: 15, Item: 64, Rating: 0.9224387353614938
+    User: 19, Item: 1997, Rating: 3.5
-    User: 15, Item: 206, Rating: 2.35668733389394
+    User: 19, Item: 2028, Rating: 3.5
-    User: 15, Item: 249, Rating: 3.1290259851652826
+    User: 19, Item: 4993, Rating: 3.5
-    User: 15, Item: 276, Rating: 2.1800017354806753
+    User: 19, Item: 5952, Rating: 3.5
-    User: 15, Item: 369, Rating: 2.3082373858282694
+    User: 19, Item: 2700, Rating: 3.5
-    User: 15, Item: 504, Rating: 2.2600496220227573
+    User: 19, Item: 1721, Rating: 3.5
-    User: 15, Item: 515, Rating: 3.6575674086958188
+    User: 19, Item: 1214, Rating: 3.5
-    User: 15, Item: 522, Rating: 2.4562020809509626
+    User: 19, Item: 364, Rating: 3.5
-    User: 15, Item: 580, Rating: 1.9073310817298395
+    User: 23, Item: 1997, Rating: 2.782649253731343
-    User: 15, Item: 599, Rating: 2.780847470837928
+    User: 23, Item: 2700, Rating: 2.349813432835821
-    User: 15, Item: 915, Rating: 2.761094249104645
+    User: 27, Item: 1997, Rating: 4.666666666666667
-    User: 15, Item: 966, Rating: 3.0894953051643195
+    User: 27, Item: 2028, Rating: 5.0
-    User: 15, Item: 1274, Rating: 2.9873500196382845
+    User: 27, Item: 5952, Rating: 5.0
-    User: 15, Item: 1299, Rating: 3.0779327239728005
+    User: 27, Item: 2700, Rating: 4.666666666666667
-    User: 15, Item: 1345, Rating: 2.2037629856623138
+    User: 27, Item: 1721, Rating: 3.104166666666667
-    User: 15, Item: 1354, Rating: 2.001877412379849
+    User: 27, Item: 364, Rating: 4.604166666666667
-    User: 15, Item: 532, Rating: 2.7123071345260277
+    User: 27, Item: 4308, Rating: 3.104166666666667
    Computing the msd similarity matrix...
    Done computing similarity matrix.
    Predictions with min_k = 2:
-    User: 15, Item: 942, Rating: 3.7769516356699464
+    User: 11, Item: 1214, Rating: 3.1666666666666665
-    User: 15, Item: 2117, Rating: 2.9340004894942537
+    User: 11, Item: 364, Rating: 2.49203431372549
-    User: 15, Item: 2672, Rating: 2.371008709611413
+    User: 11, Item: 4308, Rating: 3.1666666666666665
-    User: 15, Item: 5054, Rating: 2.693661971830986
+    User: 11, Item: 527, Rating: 3.898897058823529
-    User: 15, Item: 6322, Rating: 1.711175832857413
+    User: 13, Item: 1997, Rating: 2.8
-    User: 15, Item: 6323, Rating: 1.7645762379992287
+    User: 13, Item: 4993, Rating: 2.8
-    User: 15, Item: 6757, Rating: 2.693661971830986
+    User: 13, Item: 2700, Rating: 2.8
-    User: 15, Item: 7700, Rating: 3.561484741491386
+    User: 13, Item: 1721, Rating: 2.8
-    User: 15, Item: 7981, Rating: 3.386000174210522
+    User: 13, Item: 527, Rating: 2.8
-    User: 15, Item: 8600, Rating: 3.320743223639117
+    User: 17, Item: 2028, Rating: 3.8125
-    User: 15, Item: 8620, Rating: 2.7538763809343654
+    User: 17, Item: 4993, Rating: 4.128289473684211
-    User: 15, Item: 31952, Rating: 3.7409900837647396
+    User: 17, Item: 1214, Rating: 3.25
-    User: 15, Item: 3, Rating: 2.222062601579949
+    User: 17, Item: 4308, Rating: 3.25
-    User: 15, Item: 64, Rating: 0.9224387353614938
+    User: 19, Item: 1997, Rating: 3.5
-    User: 15, Item: 206, Rating: 2.35668733389394
+    User: 19, Item: 2028, Rating: 3.5
-    User: 15, Item: 249, Rating: 3.1290259851652826
+    User: 19, Item: 4993, Rating: 3.5
-    User: 15, Item: 276, Rating: 2.1800017354806753
+    User: 19, Item: 5952, Rating: 3.5
-    User: 15, Item: 369, Rating: 2.3082373858282694
+    User: 19, Item: 2700, Rating: 3.5
-    User: 15, Item: 504, Rating: 2.2600496220227573
+    User: 19, Item: 1721, Rating: 3.5
-    User: 15, Item: 515, Rating: 3.6575674086958188
+    User: 19, Item: 1214, Rating: 3.5
-    User: 15, Item: 522, Rating: 2.4562020809509626
+    User: 19, Item: 364, Rating: 3.5
-    User: 15, Item: 580, Rating: 1.9073310817298395
+    User: 23, Item: 1997, Rating: 2.782649253731343
-    User: 15, Item: 599, Rating: 2.780847470837928
+    User: 23, Item: 2700, Rating: 2.349813432835821
-    User: 15, Item: 915, Rating: 2.761094249104645
+    User: 27, Item: 1997, Rating: 4.666666666666667
-    User: 15, Item: 966, Rating: 2.693661971830986
+    User: 27, Item: 2028, Rating: 4.666666666666667
-    User: 15, Item: 1274, Rating: 2.9873500196382845
+    User: 27, Item: 5952, Rating: 4.666666666666667
-    User: 15, Item: 1299, Rating: 3.0779327239728005
+    User: 27, Item: 2700, Rating: 4.666666666666667
-    User: 15, Item: 1345, Rating: 2.2037629856623138
+    User: 27, Item: 1721, Rating: 4.666666666666667
-    User: 15, Item: 1354, Rating: 2.001877412379849
+    User: 27, Item: 364, Rating: 4.666666666666667
-    User: 15, Item: 532, Rating: 2.7123071345260277
+    User: 27, Item: 4308, Rating: 4.666666666666667
    Computing the msd similarity matrix...
    Done computing similarity matrix.
    Predictions with min_k = 3:
-    User: 15, Item: 942, Rating: 3.7769516356699464
+    User: 11, Item: 1214, Rating: 3.1666666666666665
-    User: 15, Item: 2117, Rating: 2.9340004894942537
+    User: 11, Item: 364, Rating: 3.1666666666666665
-    User: 15, Item: 2672, Rating: 2.371008709611413
+    User: 11, Item: 4308, Rating: 3.1666666666666665
-    User: 15, Item: 5054, Rating: 2.693661971830986
+    User: 11, Item: 527, Rating: 3.1666666666666665
-    User: 15, Item: 6322, Rating: 2.693661971830986
+    User: 13, Item: 1997, Rating: 2.8
-    User: 15, Item: 6323, Rating: 1.7645762379992287
+    User: 13, Item: 4993, Rating: 2.8
-    User: 15, Item: 6757, Rating: 2.693661971830986
+    User: 13, Item: 2700, Rating: 2.8
-    User: 15, Item: 7700, Rating: 2.693661971830986
+    User: 13, Item: 1721, Rating: 2.8
-    User: 15, Item: 7981, Rating: 3.386000174210522
+    User: 13, Item: 527, Rating: 2.8
-    User: 15, Item: 8600, Rating: 2.693661971830986
+    User: 17, Item: 2028, Rating: 3.25
-    User: 15, Item: 8620, Rating: 2.7538763809343654
+    User: 17, Item: 4993, Rating: 3.25
-    User: 15, Item: 31952, Rating: 2.693661971830986
+    User: 17, Item: 1214, Rating: 3.25
-    User: 15, Item: 3, Rating: 2.222062601579949
+    User: 17, Item: 4308, Rating: 3.25
-    User: 15, Item: 64, Rating: 0.9224387353614938
+    User: 19, Item: 1997, Rating: 3.5
-    User: 15, Item: 206, Rating: 2.35668733389394
+    User: 19, Item: 2028, Rating: 3.5
-    User: 15, Item: 249, Rating: 3.1290259851652826
+    User: 19, Item: 4993, Rating: 3.5
-    User: 15, Item: 276, Rating: 2.1800017354806753
+    User: 19, Item: 5952, Rating: 3.5
-    User: 15, Item: 369, Rating: 2.3082373858282694
+    User: 19, Item: 2700, Rating: 3.5
-    User: 15, Item: 504, Rating: 2.2600496220227573
+    User: 19, Item: 1721, Rating: 3.5
-    User: 15, Item: 515, Rating: 3.6575674086958188
+    User: 19, Item: 1214, Rating: 3.5
-    User: 15, Item: 522, Rating: 2.4562020809509626
+    User: 19, Item: 364, Rating: 3.5
-    User: 15, Item: 580, Rating: 1.9073310817298395
+    User: 23, Item: 1997, Rating: 2.5625
-    User: 15, Item: 599, Rating: 2.780847470837928
+    User: 23, Item: 2700, Rating: 2.5625
-    User: 15, Item: 915, Rating: 2.761094249104645
+    User: 27, Item: 1997, Rating: 4.666666666666667
-    User: 15, Item: 966, Rating: 2.693661971830986
+    User: 27, Item: 2028, Rating: 4.666666666666667
-    User: 15, Item: 1274, Rating: 2.9873500196382845
+    User: 27, Item: 5952, Rating: 4.666666666666667
-    User: 15, Item: 1299, Rating: 3.0779327239728005
+    User: 27, Item: 2700, Rating: 4.666666666666667
-    User: 15, Item: 1345, Rating: 2.2037629856623138
+    User: 27, Item: 1721, Rating: 4.666666666666667
-    User: 15, Item: 1354, Rating: 2.001877412379849
+    User: 27, Item: 364, Rating: 4.666666666666667
-    User: 15, Item: 532, Rating: 2.7123071345260277
+    User: 27, Item: 4308, Rating: 4.666666666666667
 %% Cell type:markdown id:c5209097 tags:
 Quels que soient les neighbours (1, 2, 3), la valeur du rating ne change pas
 %% Cell type:markdown id:c8890e11 tags:
 1). Predictions with min_k = 1: In this case, a single neighbor is enough for the model to move away from the user's mean rating. Each prediction is made from the similarity between the target user and the other users who have rated the item. Consequently, we observe varying prediction values for different items. For instance, for user 11 and item 1214, the predicted rating is 3.604, while for item 4308, the predicted rating is only 1.604. Both predictions rest on a single neighbor (actual_k = 1), which indicates that the model may rely heavily on the opinion of one similar user, leading to potentially erratic predictions.
 2). Predictions with min_k = 2: Here, a minimum of 2 neighbors are required to make a prediction. This introduces a bit of regularization, ensuring that predictions are made based on a slightly broader consensus. We notice that the predictions are somewhat similar to those with min_k = 1, but some ratings change. For example, the rating for user 11 and item 1214 changes from 3.604 to 3.167, which is the mean rating of user 11: with only one neighbor available, the model falls back to the user's mean. This suggests that the model is slightly more conservative in its predictions due to the requirement of at least two neighbors.
 3). Predictions with min_k = 3: With a minimum of 3 neighbors, the model becomes even more conservative. It requires a stronger consensus among users before making predictions. As a result, we see more uniformity in the predicted ratings compared to the previous cases. For example, for user 11 and item 364, the prediction stays at 2.492 for min_k = 1 and min_k = 2 (two neighbors are available) and finally becomes 3.167, the user's mean rating, for min_k = 3. This indicates that the model is increasingly cautious as it demands more agreement among neighbors before making predictions.
 %% Cell type:code id:cc806424 tags:
 ``` python
 def analyse_min_support(knn_model, testset):
    """Print ``actual_k`` for the first 30 test pairs with ``min_support`` set to 1, 2 and 3.

    The model is modified in place: ``min_k`` is set to 2, ``min_support`` ends
    at 3, and the model is re-fitted on its own trainset for every value.

    Args:
        knn_model: an already fitted Surprise KNN-style algorithm exposing
            ``min_k``, ``sim_options``, ``trainset``, ``fit``, ``test`` and ``sim``.
        testset: list of ``(uid, iid, r_ui)`` tuples; only the first 30 are used.

    Returns:
        None. The report (predictions and similarity matrix) is printed.
    """
    # Reset min_k to 2
    knn_model.min_k = 2
    # Change min_support from 1 to 3 and observe actual_k
    for min_support in range(1, 4):
        knn_model.sim_options['min_support'] = min_support
        # The similarity matrix is only computed during fit, so the model has to
        # be re-fitted for the new min_support to have any effect.
        knn_model.fit(knn_model.trainset)
        predictions_min_support = knn_model.test(testset[:30])  # Keep the first 30 predictions for display
        print(f"\nPrédictions avec min_support = {min_support}:")
        for prediction in predictions_min_support:
            # Impossible predictions carry no 'actual_k' entry; show None instead of crashing
            actual_k = prediction.details.get('actual_k')
            print(f"User: {prediction.uid}, Item: {prediction.iid}, Actual_k: {actual_k}")
    # Display the similarity matrix of the last fit (min_support = 3)
    similarity_matrix = knn_model.sim
    print("\nMatrice de similarité:")
    print(similarity_matrix)
 # Run the analysis on `algo`, the KNNWithMeans model fitted above. No notebook-level
 # `knn_model` exists any more, so referring to it fails on a fresh kernel.
 # The function prints its own report and returns nothing, so there is no result to print.
 analyse_min_support(algo, testset)
 ```
 %% Output
    Prédictions avec min_support = 1:
-    User: 15, Item: 942, Actual_k: 3
+    User: 11, Item: 1214, Actual_k: 1
-    User: 15, Item: 2117, Actual_k: 3
+    User: 11, Item: 364, Actual_k: 2
-    User: 15, Item: 2672, Actual_k: 3
+    User: 11, Item: 4308, Actual_k: 1
-    User: 15, Item: 5054, Actual_k: 1
+    User: 11, Item: 527, Actual_k: 2
-    User: 15, Item: 6322, Actual_k: 2
+    User: 13, Item: 1997, Actual_k: 0
-    User: 15, Item: 6323, Actual_k: 3
+    User: 13, Item: 4993, Actual_k: 1
-    User: 15, Item: 6757, Actual_k: 1
+    User: 13, Item: 2700, Actual_k: 0
-    User: 15, Item: 7700, Actual_k: 2
+    User: 13, Item: 1721, Actual_k: 1
-    User: 15, Item: 7981, Actual_k: 3
+    User: 13, Item: 527, Actual_k: 1
-    User: 15, Item: 8600, Actual_k: 2
+    User: 17, Item: 2028, Actual_k: 2
-    User: 15, Item: 8620, Actual_k: 3
+    User: 17, Item: 4993, Actual_k: 2
-    User: 15, Item: 31952, Actual_k: 2
+    User: 17, Item: 1214, Actual_k: 1
-    User: 15, Item: 3, Actual_k: 3
+    User: 17, Item: 4308, Actual_k: 1
-    User: 15, Item: 64, Actual_k: 3
+    User: 19, Item: 1997, Actual_k: 0
-    User: 15, Item: 206, Actual_k: 3
+    User: 19, Item: 2028, Actual_k: 0
-    User: 15, Item: 249, Actual_k: 3
+    User: 19, Item: 4993, Actual_k: 0
-    User: 15, Item: 276, Actual_k: 3
+    User: 19, Item: 5952, Actual_k: 0
-    User: 15, Item: 369, Actual_k: 3
+    User: 19, Item: 2700, Actual_k: 0
-    User: 15, Item: 504, Actual_k: 3
+    User: 19, Item: 1721, Actual_k: 0
-    User: 15, Item: 515, Actual_k: 3
+    User: 19, Item: 1214, Actual_k: 0
-    User: 15, Item: 522, Actual_k: 3
+    User: 19, Item: 364, Actual_k: 0
-    User: 15, Item: 580, Actual_k: 3
+    User: 23, Item: 1997, Actual_k: 2
-    User: 15, Item: 599, Actual_k: 3
+    User: 23, Item: 2700, Actual_k: 2
-    User: 15, Item: 915, Actual_k: 3
+    User: 27, Item: 1997, Actual_k: 0
-    User: 15, Item: 966, Actual_k: 1
+    User: 27, Item: 2028, Actual_k: 1
-    User: 15, Item: 1274, Actual_k: 3
+    User: 27, Item: 5952, Actual_k: 1
-    User: 15, Item: 1299, Actual_k: 3
+    User: 27, Item: 2700, Actual_k: 0
-    User: 15, Item: 1345, Actual_k: 3
+    User: 27, Item: 1721, Actual_k: 1
-    User: 15, Item: 1354, Actual_k: 3
+    User: 27, Item: 364, Actual_k: 1
-    User: 15, Item: 532, Actual_k: 3
+    User: 27, Item: 4308, Actual_k: 1
    Prédictions avec min_support = 2:
-    User: 15, Item: 942, Actual_k: 3
+    User: 11, Item: 1214, Actual_k: 1
-    User: 15, Item: 2117, Actual_k: 3
+    User: 11, Item: 364, Actual_k: 2
-    User: 15, Item: 2672, Actual_k: 3
+    User: 11, Item: 4308, Actual_k: 1
-    User: 15, Item: 5054, Actual_k: 1
+    User: 11, Item: 527, Actual_k: 2
-    User: 15, Item: 6322, Actual_k: 2
+    User: 13, Item: 1997, Actual_k: 0
-    User: 15, Item: 6323, Actual_k: 3
+    User: 13, Item: 4993, Actual_k: 1
-    User: 15, Item: 6757, Actual_k: 1
+    User: 13, Item: 2700, Actual_k: 0
-    User: 15, Item: 7700, Actual_k: 2
+    User: 13, Item: 1721, Actual_k: 1
-    User: 15, Item: 7981, Actual_k: 3
+    User: 13, Item: 527, Actual_k: 1
-    User: 15, Item: 8600, Actual_k: 2
+    User: 17, Item: 2028, Actual_k: 2
-    User: 15, Item: 8620, Actual_k: 3
+    User: 17, Item: 4993, Actual_k: 2
-    User: 15, Item: 31952, Actual_k: 2
+    User: 17, Item: 1214, Actual_k: 1
-    User: 15, Item: 3, Actual_k: 3
+    User: 17, Item: 4308, Actual_k: 1
-    User: 15, Item: 64, Actual_k: 3
+    User: 19, Item: 1997, Actual_k: 0
-    User: 15, Item: 206, Actual_k: 3
+    User: 19, Item: 2028, Actual_k: 0
-    User: 15, Item: 249, Actual_k: 3
+    User: 19, Item: 4993, Actual_k: 0
-    User: 15, Item: 276, Actual_k: 3
+    User: 19, Item: 5952, Actual_k: 0
-    User: 15, Item: 369, Actual_k: 3
+    User: 19, Item: 2700, Actual_k: 0
-    User: 15, Item: 504, Actual_k: 3
+    User: 19, Item: 1721, Actual_k: 0
-    User: 15, Item: 515, Actual_k: 3
+    User: 19, Item: 1214, Actual_k: 0
-    User: 15, Item: 522, Actual_k: 3
+    User: 19, Item: 364, Actual_k: 0
-    User: 15, Item: 580, Actual_k: 3
+    User: 23, Item: 1997, Actual_k: 2
-    User: 15, Item: 599, Actual_k: 3
+    User: 23, Item: 2700, Actual_k: 2
-    User: 15, Item: 915, Actual_k: 3
+    User: 27, Item: 1997, Actual_k: 0
-    User: 15, Item: 966, Actual_k: 1
+    User: 27, Item: 2028, Actual_k: 1
-    User: 15, Item: 1274, Actual_k: 3
+    User: 27, Item: 5952, Actual_k: 1
-    User: 15, Item: 1299, Actual_k: 3
+    User: 27, Item: 2700, Actual_k: 0
-    User: 15, Item: 1345, Actual_k: 3
+    User: 27, Item: 1721, Actual_k: 1
-    User: 15, Item: 1354, Actual_k: 3
+    User: 27, Item: 364, Actual_k: 1
-    User: 15, Item: 532, Actual_k: 3
+    User: 27, Item: 4308, Actual_k: 1
    Prédictions avec min_support = 3:
-    User: 15, Item: 942, Actual_k: 3
+    User: 11, Item: 1214, Actual_k: 1
-    User: 15, Item: 2117, Actual_k: 3
+    User: 11, Item: 364, Actual_k: 2
-    User: 15, Item: 2672, Actual_k: 3
+    User: 11, Item: 4308, Actual_k: 1
-    User: 15, Item: 5054, Actual_k: 1
+    User: 11, Item: 527, Actual_k: 2
-    User: 15, Item: 6322, Actual_k: 2
+    User: 13, Item: 1997, Actual_k: 0
-    User: 15, Item: 6323, Actual_k: 3
+    User: 13, Item: 4993, Actual_k: 1
-    User: 15, Item: 6757, Actual_k: 1
+    User: 13, Item: 2700, Actual_k: 0
-    User: 15, Item: 7700, Actual_k: 2
+    User: 13, Item: 1721, Actual_k: 1
-    User: 15, Item: 7981, Actual_k: 3
+    User: 13, Item: 527, Actual_k: 1
-    User: 15, Item: 8600, Actual_k: 2
+    User: 17, Item: 2028, Actual_k: 2
-    User: 15, Item: 8620, Actual_k: 3
+    User: 17, Item: 4993, Actual_k: 2
-    User: 15, Item: 31952, Actual_k: 2
+    User: 17, Item: 1214, Actual_k: 1
-    User: 15, Item: 3, Actual_k: 3
+    User: 17, Item: 4308, Actual_k: 1
-    User: 15, Item: 64, Actual_k: 3
+    User: 19, Item: 1997, Actual_k: 0
-    User: 15, Item: 206, Actual_k: 3
+    User: 19, Item: 2028, Actual_k: 0
-    User: 15, Item: 249, Actual_k: 3
+    User: 19, Item: 4993, Actual_k: 0
-    User: 15, Item: 276, Actual_k: 3
+    User: 19, Item: 5952, Actual_k: 0
-    User: 15, Item: 369, Actual_k: 3
+    User: 19, Item: 2700, Actual_k: 0
-    User: 15, Item: 504, Actual_k: 3
+    User: 19, Item: 1721, Actual_k: 0
-    User: 15, Item: 515, Actual_k: 3
+    User: 19, Item: 1214, Actual_k: 0
-    User: 15, Item: 522, Actual_k: 3
+    User: 19, Item: 364, Actual_k: 0
-    User: 15, Item: 580, Actual_k: 3
+    User: 23, Item: 1997, Actual_k: 2
-    User: 15, Item: 599, Actual_k: 3
+    User: 23, Item: 2700, Actual_k: 2
-    User: 15, Item: 915, Actual_k: 3
+    User: 27, Item: 1997, Actual_k: 0
-    User: 15, Item: 966, Actual_k: 1
+    User: 27, Item: 2028, Actual_k: 1
-    User: 15, Item: 1274, Actual_k: 3
+    User: 27, Item: 5952, Actual_k: 1
-    User: 15, Item: 1299, Actual_k: 3
+    User: 27, Item: 2700, Actual_k: 0
-    User: 15, Item: 1345, Actual_k: 3
+    User: 27, Item: 1721, Actual_k: 1
-    User: 15, Item: 1354, Actual_k: 3
+    User: 27, Item: 364, Actual_k: 1
-    User: 15, Item: 532, Actual_k: 3
+    User: 27, Item: 4308, Actual_k: 1
    Matrice de similarité:
-    [[1.         0.39130435 0.35942029 ... 0.24358974 0.28513238 0.21451104]
+    [[1.         0.         0.24615385 0.         0.43243243 0.        ]
-     [0.39130435 1.         0.32786885 ... 0.30967742 0.42424242 0.21621622]
+     [0.         1.         0.         0.         0.17094017 0.        ]
-     [0.35942029 0.32786885 1.         ... 0.36666667 0.72727273 0.34375   ]
+     [0.24615385 0.         1.         0.         0.53333333 0.        ]
-     ...
+     [0.         0.         0.         1.         0.         0.        ]
-     [0.24358974 0.30967742 0.36666667 ... 1.         0.6779661  0.37569061]
+     [0.43243243 0.17094017 0.53333333 0.         1.         0.25      ]
-     [0.28513238 0.42424242 0.72727273 ... 0.6779661  1.         0.83333333]
+     [0.         0.         0.         0.         0.25       1.        ]]
-     [0.21451104 0.21621622 0.34375    ... 0.37569061 0.83333333 1.        ]]
    None
 %% Cell type:markdown id:2dd01f5b tags:
 # 3. Implement and explore a customizable user-based algorithm
 Create a self-made user-based algorithm allowing to customize the similarity metric, peer group calculation and aggregation function
 %% Cell type:code id:d03ed9eb tags:
 ``` python
 class UserBased(AlgoBase):
    """User-based k-NN recommender with mean-centred ratings and Jaccard similarity.

    The prediction for user ``u`` and item ``i`` is the mean rating of ``u`` plus
    the similarity-weighted average of the deviations ``r_vi - mean(v)`` over the
    (at most) ``k`` most similar users ``v`` who rated ``i``.

    Args:
        k: maximum number of neighbours used for a prediction.
        min_k: minimum number of neighbours with a positive similarity; below
            it the prediction falls back to the user's mean rating.
        sim_options: similarity options. Only ``'min_support'`` (minimum number
            of co-rated items, default 1) is used by this class; the similarity
            itself is always Jaccard.
        **kwargs: forwarded to ``AlgoBase.__init__``.
    """
    def __init__(self, k=3, min_k=1, sim_options=None, **kwargs):
        # A fresh dict per instance: AlgoBase.__init__ writes into sim_options,
        # so a shared mutable default would leak state between instances.
        if sim_options is None:
            sim_options = {}
        AlgoBase.__init__(self, sim_options=sim_options, **kwargs)
        self.k = k
        self.min_k = min_k
        self.sim_options = sim_options
    def fit(self, trainset):
        """Store the trainset and precompute ratings, similarities and user means.

        Returns:
            self, following the Surprise convention so calls can be chained.
        """
        AlgoBase.fit(self, trainset)
        self.compute_rating_matrix()
        self.compute_similarity_matrix()
        self.compute_mean_ratings()
        return self
    def estimate(self, u, i):
        """Estimate the rating of inner user ``u`` for inner item ``i``.

        Raises:
            PredictionImpossible: if the user or the item is not in the trainset.
        """
        if not (self.trainset.knows_user(u) and self.trainset.knows_item(i)):
            raise PredictionImpossible('User and/or item is unknown.')
        est = self.mean_ratings[u]
        # Step 1: peer group of u for item i. trainset.ir[i] holds
        # (user_inner_id, rating) pairs, so v indexes the similarity matrix.
        peer_group = [(v, self.sim[u, v], rating) for v, rating in self.trainset.ir[i]]
        # Step 2: keep the k most similar neighbours
        k_neighbors = heapq.nlargest(self.k, peer_group, key=lambda x: x[1])
        # Step 3: similarity-weighted average of the mean-centred ratings
        weighted_sum = 0
        total_similarity = 0
        actual_k = 0
        for v, similarity, rating in k_neighbors:
            if similarity > 0:  # neighbours with no similarity carry no information
                weighted_sum += similarity * (rating - self.mean_ratings[v])
                total_similarity += similarity
                actual_k += 1
        # Not enough useful neighbours: keep the user's mean rating
        if actual_k >= self.min_k and total_similarity > 0:
            est += weighted_sum / total_similarity
        return est
    def compute_rating_matrix(self):
        """Build ``self.ratings_matrix`` (n_users x n_items), NaN where no rating exists."""
        ratings_matrix = np.full((self.trainset.n_users, self.trainset.n_items), np.nan)
        # Fill in the ratings matrix with the available ratings
        for user_id, user_ratings in self.trainset.ur.items():
            for item_id, rating in user_ratings:
                ratings_matrix[user_id, item_id] = rating
        self.ratings_matrix = ratings_matrix
    def compute_similarity_matrix(self):
        """Build ``self.sim``, the user-user Jaccard similarity on sets of rated items.

        Pairs sharing fewer than ``sim_options['min_support']`` items (default 1)
        get a similarity of 0; the diagonal is 1. Requires ``self.ratings_matrix``.
        """
        min_support = self.sim_options.get('min_support', 1)
        # rated[u, i] is True when user u rated item i
        rated = ~np.isnan(self.ratings_matrix)
        rated_int = rated.astype(int)
        n_rated = rated_int.sum(axis=1)
        # Number of co-rated items for every pair of users
        intersection = rated_int @ rated_int.T
        # |A ∪ B| = |A| + |B| - |A ∩ B|
        union = n_rated[:, None] + n_rated[None, :] - intersection
        similarity_matrix = np.zeros(intersection.shape, dtype=float)
        enough_support = (intersection >= min_support) & (union > 0)
        np.divide(intersection, union, out=similarity_matrix, where=enough_support)
        np.fill_diagonal(similarity_matrix, 1.0)
        self.sim = similarity_matrix
    def compute_mean_ratings(self):
        """Build ``self.mean_ratings``, indexed by user inner id (0 when no ratings)."""
        mean_ratings = [0] * self.trainset.n_users
        for user_id, ratings in self.trainset.ur.items():
            if ratings:  # users without ratings keep a mean of 0
                mean_ratings[user_id] = np.mean([rating for _, rating in ratings])
        self.mean_ratings = mean_ratings
 # The constructor takes no trainset (the former `trainset=` keyword was silently
 # ignored); the data is supplied to fit() instead.
 user_based_instance = UserBased()
 # Call fit to compute the ratings matrix, the similarity matrix and the mean ratings
 user_based_instance.fit(trainset)
 # Display the ratings matrix
 print(user_based_instance.ratings_matrix)
 ```
 %% Output
-    [[3.  1.5 4.  ... nan nan nan]
+    [[1.5 4.  5.  4.5 3.  1.  nan nan nan nan]
-     [nan nan nan ... nan nan nan]
+     [nan 2.  nan 2.  nan nan 1.  5.  4.  nan]
-     [4.  3.  3.  ... nan nan nan]
+     [5.  nan nan 4.5 3.  1.  nan 1.5 nan 4.5]
-     ...
+     [nan nan nan nan nan nan nan nan 2.  5. ]
-     [4.5 nan nan ... nan nan nan]
+     [nan 3.  3.  4.  nan 1.  3.  2.5 1.  3. ]
-     [nan nan nan ... nan nan nan]
+     [nan nan 5.  nan nan nan 4.  nan nan 5. ]]
-     [2.  nan nan ... nan nan nan]]
 %% Cell type:markdown id:dfdc9cfe tags:
 # 4. Compare KNNWithMeans with UserBased
 Try to replicate KNNWithMeans with your self-made UserBased and check that outcomes are identical
 %% Cell type:code id:be53ae27 tags:
 ``` python
 # 1. Obtain Predictions
 # `testset` is the anti-testset built in section 1: its target ratings are the
 # fill value used by build_anti_testset (the global mean by default), not real
 # ratings, so the metrics below measure the distance to that fill value.
 # Using UserBased algorithm
 user_based_predictions = user_based_instance.test(testset)
 # Using KNNWithMeans algorithm. `algo` is the model fitted in section 2; no
 # notebook-level `knn_model` exists any more.
 knn_predictions = algo.test(testset)
 # 2. Calculate Metrics
 # Calculate MAE and RMSE for UserBased algorithm
 user_based_mae = accuracy.mae(user_based_predictions, verbose=False)
 user_based_rmse = accuracy.rmse(user_based_predictions, verbose=False)
 # Calculate MAE and RMSE for KNNWithMeans algorithm
 knn_mae = accuracy.mae(knn_predictions, verbose=False)
 knn_rmse = accuracy.rmse(knn_predictions, verbose=False)
 # 3. Compare Results
 print("UserBased MAE:", user_based_mae)
 print("UserBased RMSE:", user_based_rmse)
 print("KNNWithMeans MAE:", knn_mae)
 print("KNNWithMeans RMSE:", knn_rmse)
 ```
 %% Output
-    UserBased MAE: 1.5398252671298895
+    UserBased MAE: 1.7175000000000002
-    UserBased RMSE: 1.5553141029705104
+    UserBased RMSE: 1.7384170241918369
-    KNNWithMeans MAE: 0.5419110316300769
+    KNNWithMeans MAE: 0.661617428851614
-    KNNWithMeans RMSE: 0.7019543155680094
+    KNNWithMeans RMSE: 0.8426896111887758
 %% Cell type:markdown id:cced76d9 tags:
 # 5. Compare MSD and Jaccard
 Compare predictions made with MSD similarity and Jaccard similarity
 %% Cell type:code id:c20d8e19 tags:
 ``` python
 from surprise import accuracy
 from surprise.model_selection import train_test_split
 from surprise import Dataset, Reader
 from surprise import KNNBasic
 # Split the dataset into training and testing sets.
 # A fixed random_state keeps the split, and therefore the RMSE values below, reproducible across runs.
 trainset, testset = train_test_split(surprise_data, test_size=0.2, random_state=42)
 # Initialize and fit the model with MSD similarity
 sim_options_msd = {'name': 'msd'}
 user_based_msd = KNNBasic(sim_options=sim_options_msd)
 user_based_msd.fit(trainset)
 # Initialize and fit the model with cosine similarity.
 # NOTE: the similarity requested here is 'cosine', not Jaccard, so the names and the
 # printed label say "cosine". TODO: plug in an actual Jaccard similarity if that is the intended comparison.
 sim_options_cosine = {'name': 'cosine'}
 user_based_cosine = KNNBasic(sim_options=sim_options_cosine)
 user_based_cosine.fit(trainset)
 # Make predictions with each model on the test set
 predictions_msd = user_based_msd.test(testset)
 predictions_cosine = user_based_cosine.test(testset)
 # Compute the RMSE of each model; verbose=False avoids printing every value twice
 rmse_msd = accuracy.rmse(predictions_msd, verbose=False)
 rmse_cosine = accuracy.rmse(predictions_cosine, verbose=False)
 print("RMSE with MSD similarity:", rmse_msd)
 print("RMSE with cosine similarity:", rmse_cosine)
 # Backward-compatible aliases: these results were previously exposed under "jaccard" names
 sim_options_jaccard, user_based_jaccard = sim_options_cosine, user_based_cosine
 predictions_jaccard, rmse_jaccard = predictions_cosine, rmse_cosine
 ```
 %% Output
    Computing the msd similarity matrix...
    Done computing similarity matrix.
    Computing the cosine similarity matrix...
    Done computing similarity matrix.
-    RMSE: 0.9799
+    RMSE: 1.0812
-    RMSE: 0.9871
+    RMSE: 1.0910
-    RMSE with MSD similarity: 0.9798533097556152
+    RMSE with MSD similarity: 1.0811758629789194
-    RMSE with Jaccard similarity: 0.9870653791755158
+    RMSE with Jaccard similarity: 1.0910225374454734