update eval block

9823af64 · Adrien Payen · c53e2367 · 9823af64
--- a/evaluator.ipynb
+++ b/evaluator.ipynb
@@ -13,7 +13,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 61,
+   "execution_count": 109,
   "id": "6aaf9140",
   "metadata": {},
   "outputs": [
@@ -59,7 +59,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 62,
+   "execution_count": 110,
   "id": "d6d82188",
   "metadata": {},
   "outputs": [],
@@ -201,7 +201,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 63,
+   "execution_count": 111,
   "id": "f1849e55",
   "metadata": {},
   "outputs": [],
@@ -257,7 +257,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 64,
+   "execution_count": 112,
   "id": "704f4d2a",
   "metadata": {},
   "outputs": [
@@ -302,31 +302,109 @@
      "Training loo predictions\n",
      "Training full predictions\n",
      "Handling model ContentBased_Lr\n",
-      "Training split predictions\n"
+      "Training split predictions\n",
+      "- computing metric mae\n",
+      "- computing metric rmse\n",
+      "Training loo predictions\n",
+      "Training full predictions\n",
+      "The data has been exported to the evaluation report\n"
     ]
    },
    {
-     "ename": "ValueError",
+     "data": {
-     "evalue": "1210 is not a valid inner id.",
+      "text/html": [
-     "output_type": "error",
+       "<div>\n",
-     "traceback": [
+       "<style scoped>\n",
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+       "    .dataframe tbody tr th:only-of-type {\n",
-      "\u001b[0;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
+       "        vertical-align: middle;\n",
-      "File \u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/surprise/trainset.py:180\u001b[0m, in \u001b[0;36mTrainset.to_raw_iid\u001b[0;34m(self, iiid)\u001b[0m\n\u001b[1;32m    179\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[0;32m--> 180\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_inner2raw_id_items\u001b[49m\u001b[43m[\u001b[49m\u001b[43miiid\u001b[49m\u001b[43m]\u001b[49m\n\u001b[1;32m    181\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mKeyError\u001b[39;00m:\n",
+       "    }\n",
-      "\u001b[0;31mKeyError\u001b[0m: 1210",
+       "\n",
-      "\nDuring handling of the above exception, another exception occurred:\n",
+       "    .dataframe tbody tr th {\n",
-      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
+       "        vertical-align: top;\n",
-      "Cell \u001b[0;32mIn[64], line 16\u001b[0m\n\u001b[1;32m     14\u001b[0m sp_ratings \u001b[38;5;241m=\u001b[39m load_ratings(surprise_format\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)\n\u001b[1;32m     15\u001b[0m precomputed_dict \u001b[38;5;241m=\u001b[39m precomputed_information(pd\u001b[38;5;241m.\u001b[39mread_csv(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdata/tiny/evidence/ratings.csv\u001b[39m\u001b[38;5;124m\"\u001b[39m))\n\u001b[0;32m---> 16\u001b[0m evaluation_report \u001b[38;5;241m=\u001b[39m \u001b[43mcreate_evaluation_report\u001b[49m\u001b[43m(\u001b[49m\u001b[43mEvalConfig\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43msp_ratings\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mprecomputed_dict\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mAVAILABLE_METRICS\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m     17\u001b[0m export_evaluation_report(evaluation_report)\n",
+       "    }\n",
-      "Cell \u001b[0;32mIn[62], line 95\u001b[0m, in \u001b[0;36mcreate_evaluation_report\u001b[0;34m(eval_config, sp_ratings, precomputed_dict, available_metrics)\u001b[0m\n\u001b[1;32m     93\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(eval_config\u001b[38;5;241m.\u001b[39msplit_metrics) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m     94\u001b[0m     \u001b[38;5;28mprint\u001b[39m(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mTraining split predictions\u001b[39m\u001b[38;5;124m'\u001b[39m)\n\u001b[0;32m---> 95\u001b[0m     predictions \u001b[38;5;241m=\u001b[39m \u001b[43mgenerate_split_predictions\u001b[49m\u001b[43m(\u001b[49m\u001b[43malgo\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43msp_ratings\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43meval_config\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m     96\u001b[0m     \u001b[38;5;28;01mfor\u001b[39;00m metric \u001b[38;5;129;01min\u001b[39;00m eval_config\u001b[38;5;241m.\u001b[39msplit_metrics:\n\u001b[1;32m     97\u001b[0m         \u001b[38;5;28mprint\u001b[39m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124m- computing metric \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mmetric\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m'\u001b[39m)\n",
+       "\n",
-      "Cell \u001b[0;32mIn[62], line 9\u001b[0m, in \u001b[0;36mgenerate_split_predictions\u001b[0;34m(algo, ratings_dataset, eval_config)\u001b[0m\n\u001b[1;32m      6\u001b[0m trainset, testset \u001b[38;5;241m=\u001b[39m train_test_split(ratings_dataset, test_size\u001b[38;5;241m=\u001b[39meval_config\u001b[38;5;241m.\u001b[39mtest_size)\n\u001b[1;32m      8\u001b[0m \u001b[38;5;66;03m# Training the algorithm on the train data set\u001b[39;00m\n\u001b[0;32m----> 9\u001b[0m \u001b[43malgo\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfit\u001b[49m\u001b[43m(\u001b[49m\u001b[43mtrainset\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m     11\u001b[0m \u001b[38;5;66;03m# Predict ratings for the testset\u001b[39;00m\n\u001b[1;32m     12\u001b[0m predictions \u001b[38;5;241m=\u001b[39m algo\u001b[38;5;241m.\u001b[39mtest(testset)\n",
+       "    .dataframe thead th {\n",
-      "File \u001b[0;32m~/vscodeworkspace/recomsys/models.py:130\u001b[0m, in \u001b[0;36mContentBased.fit\u001b[0;34m(self, trainset)\u001b[0m\n\u001b[1;32m    126\u001b[0m user_ratings \u001b[38;5;241m=\u001b[39m [(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtrainset\u001b[38;5;241m.\u001b[39mto_raw_iid(i), rating) \u001b[38;5;28;01mfor\u001b[39;00m (i, rating) \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtrainset\u001b[38;5;241m.\u001b[39mur[u]]\n\u001b[1;32m    128\u001b[0m df_user \u001b[38;5;241m=\u001b[39m pd\u001b[38;5;241m.\u001b[39mDataFrame(user_ratings, columns \u001b[38;5;241m=\u001b[39m [\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mitem_id\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124muser_ratings\u001b[39m\u001b[38;5;124m\"\u001b[39m])\n\u001b[0;32m--> 130\u001b[0m df_user[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mitem_id\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m \u001b[43mdf_user\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mitem_id\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmap\u001b[49m\u001b[43m(\u001b[49m\u001b[43mtrainset\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mto_raw_iid\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    132\u001b[0m df_user \u001b[38;5;241m=\u001b[39m df_user\u001b[38;5;241m.\u001b[39mmerge(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcontent_features, left_on \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mitem_id\u001b[39m\u001b[38;5;124m\"\u001b[39m, right_index \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mTrue\u001b[39;00m, how \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m'\u001b[39m\u001b[38;5;124mleft\u001b[39m\u001b[38;5;124m'\u001b[39m)\n\u001b[1;32m    134\u001b[0m X \u001b[38;5;241m=\u001b[39m 
df_user[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mn_character_title\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues\u001b[38;5;241m.\u001b[39mreshape(\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m,\u001b[38;5;241m1\u001b[39m)\n",
+       "        text-align: right;\n",
-      "File \u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/series.py:4544\u001b[0m, in \u001b[0;36mSeries.map\u001b[0;34m(self, arg, na_action)\u001b[0m\n\u001b[1;32m   4464\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mmap\u001b[39m(\n\u001b[1;32m   4465\u001b[0m     \u001b[38;5;28mself\u001b[39m,\n\u001b[1;32m   4466\u001b[0m     arg: Callable \u001b[38;5;241m|\u001b[39m Mapping \u001b[38;5;241m|\u001b[39m Series,\n\u001b[1;32m   4467\u001b[0m     na_action: Literal[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mignore\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m|\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m   4468\u001b[0m ) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m Series:\n\u001b[1;32m   4469\u001b[0m \u001b[38;5;250m    \u001b[39m\u001b[38;5;124;03m\"\"\"\u001b[39;00m\n\u001b[1;32m   4470\u001b[0m \u001b[38;5;124;03m    Map values of Series according to an input mapping or function.\u001b[39;00m\n\u001b[1;32m   4471\u001b[0m \n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m   4542\u001b[0m \u001b[38;5;124;03m    dtype: object\u001b[39;00m\n\u001b[1;32m   4543\u001b[0m \u001b[38;5;124;03m    \"\"\"\u001b[39;00m\n\u001b[0;32m-> 4544\u001b[0m     new_values \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_map_values\u001b[49m\u001b[43m(\u001b[49m\u001b[43marg\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mna_action\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mna_action\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m   4545\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_constructor(new_values, index\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mindex, 
copy\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\u001b[38;5;241m.\u001b[39m__finalize__(\n\u001b[1;32m   4546\u001b[0m         \u001b[38;5;28mself\u001b[39m, method\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mmap\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[1;32m   4547\u001b[0m     )\n",
+       "    }\n",
-      "File \u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/base.py:921\u001b[0m, in \u001b[0;36mIndexOpsMixin._map_values\u001b[0;34m(self, mapper, na_action, convert)\u001b[0m\n\u001b[1;32m    918\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(arr, ExtensionArray):\n\u001b[1;32m    919\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m arr\u001b[38;5;241m.\u001b[39mmap(mapper, na_action\u001b[38;5;241m=\u001b[39mna_action)\n\u001b[0;32m--> 921\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43malgorithms\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmap_array\u001b[49m\u001b[43m(\u001b[49m\u001b[43marr\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmapper\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mna_action\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mna_action\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mconvert\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mconvert\u001b[49m\u001b[43m)\u001b[49m\n",
+       "</style>\n",
-      "File \u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/algorithms.py:1814\u001b[0m, in \u001b[0;36mmap_array\u001b[0;34m(arr, mapper, na_action, convert)\u001b[0m\n\u001b[1;32m   1812\u001b[0m values \u001b[38;5;241m=\u001b[39m arr\u001b[38;5;241m.\u001b[39mastype(\u001b[38;5;28mobject\u001b[39m, copy\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\n\u001b[1;32m   1813\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m na_action \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m-> 1814\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mlib\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmap_infer\u001b[49m\u001b[43m(\u001b[49m\u001b[43mvalues\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmapper\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mconvert\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mconvert\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m   1815\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m   1816\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m lib\u001b[38;5;241m.\u001b[39mmap_infer_mask(\n\u001b[1;32m   1817\u001b[0m         values, mapper, mask\u001b[38;5;241m=\u001b[39misna(values)\u001b[38;5;241m.\u001b[39mview(np\u001b[38;5;241m.\u001b[39muint8), convert\u001b[38;5;241m=\u001b[39mconvert\n\u001b[1;32m   1818\u001b[0m     )\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
-      "File \u001b[0;32mlib.pyx:2926\u001b[0m, in \u001b[0;36mpandas._libs.lib.map_infer\u001b[0;34m()\u001b[0m\n",
+       "  <thead>\n",
-      "File \u001b[0;32m/Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/surprise/trainset.py:182\u001b[0m, in \u001b[0;36mTrainset.to_raw_iid\u001b[0;34m(self, iiid)\u001b[0m\n\u001b[1;32m    180\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_inner2raw_id_items[iiid]\n\u001b[1;32m    181\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mKeyError\u001b[39;00m:\n\u001b[0;32m--> 182\u001b[0m     \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;28mstr\u001b[39m(iiid) \u001b[38;5;241m+\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m is not a valid inner id.\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n",
+       "    <tr style=\"text-align: right;\">\n",
-      "\u001b[0;31mValueError\u001b[0m: 1210 is not a valid inner id."
+       "      <th></th>\n",
-     ]
+       "      <th>mae</th>\n",
+       "      <th>rmse</th>\n",
+       "      <th>hit_rate</th>\n",
+       "      <th>novelty</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>baseline_1</th>\n",
+       "      <td>1.561178</td>\n",
+       "      <td>1.792482</td>\n",
+       "      <td>0.074766</td>\n",
+       "      <td>99.405607</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>baseline_2</th>\n",
+       "      <td>1.471412</td>\n",
+       "      <td>1.819364</td>\n",
+       "      <td>0.000000</td>\n",
+       "      <td>429.942991</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>baseline_3</th>\n",
+       "      <td>0.878270</td>\n",
+       "      <td>1.085591</td>\n",
+       "      <td>0.074766</td>\n",
+       "      <td>99.405607</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>baseline_4</th>\n",
+       "      <td>0.705673</td>\n",
+       "      <td>0.912313</td>\n",
+       "      <td>0.130841</td>\n",
+       "      <td>60.202804</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>ContentBased_sample</th>\n",
+       "      <td>1.013747</td>\n",
+       "      <td>1.350417</td>\n",
+       "      <td>0.084112</td>\n",
+       "      <td>178.048598</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>ContentBased_score</th>\n",
+       "      <td>1.461846</td>\n",
+       "      <td>1.803067</td>\n",
+       "      <td>0.018692</td>\n",
+       "      <td>437.222430</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>ContentBased_Lr</th>\n",
+       "      <td>1.202626</td>\n",
+       "      <td>1.460273</td>\n",
+       "      <td>0.084112</td>\n",
+       "      <td>278.046729</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                          mae      rmse  hit_rate     novelty\n",
+       "baseline_1           1.561178  1.792482  0.074766   99.405607\n",
+       "baseline_2           1.471412  1.819364  0.000000  429.942991\n",
+       "baseline_3           0.878270  1.085591  0.074766   99.405607\n",
+       "baseline_4           0.705673  0.912313  0.130841   60.202804\n",
+       "ContentBased_sample  1.013747  1.350417  0.084112  178.048598\n",
+       "ContentBased_score   1.461846  1.803067  0.018692  437.222430\n",
+       "ContentBased_Lr      1.202626  1.460273  0.084112  278.046729"
+      ]
+     },
+     "execution_count": 112,
+     "metadata": {},
+     "output_type": "execute_result"
    }
   ],
   "source": [

 %% Cell type:markdown id:a665885b tags:
 # Evaluator Module
 The Evaluator module creates evaluation reports.
 Reports contain evaluation metrics depending on models specified in the evaluation config.
 %% Cell type:code id:6aaf9140 tags:
 ``` python
 # reloads modules automatically before entering the execution of code
 %load_ext autoreload
 %autoreload 2
 # imports
 import numpy as np
 import pandas as pd
 # local imports
 from configs import EvalConfig
 from constants import Constant as C
 from loaders import export_evaluation_report
 from loaders import load_ratings
 # New imports
 from surprise.model_selection import train_test_split
 from surprise import accuracy
 from surprise.model_selection import LeaveOneOut
 from collections import Counter
 ```
 %% Output
    The autoreload extension is already loaded. To reload it, use:
      %reload_ext autoreload
 %% Cell type:markdown id:d47c24a4 tags:
 # 1. Model validation functions
 Validation functions are a way to perform cross-validation on recommender system models.
 %% Cell type:code id:d6d82188 tags:
 ``` python
 # -- implement the function generate_split_predictions --
 def generate_split_predictions(algo, ratings_dataset, eval_config):
    """Fit ``algo`` on a random train split and predict the held-out ratings.

    The share of ratings held out for testing is ``eval_config.test_size``.
    Returns whatever ``algo.test`` produces for the held-out test set.
    """
    # Random partition of the ratings into a training part and a held-out part
    train_part, heldout_part = train_test_split(
        ratings_dataset, test_size=eval_config.test_size
    )
    algo.fit(train_part)
    return algo.test(heldout_part)
 # -- implement the function generate_loo_top_n --
 def generate_loo_top_n(algo, ratings_dataset, eval_config):
    """Build per-user top-n recommendations from a single leave-one-out split.

    ``algo`` is fitted on the training part of the split and then asked to
    predict the anti test-set built from that training part. For each user the
    ``eval_config.top_n_value`` highest-estimated items are kept.

    Returns a tuple ``(top_n, testset)`` where ``top_n`` maps each user id to a
    list of ``(item id, estimate)`` pairs sorted by decreasing estimate, and
    ``testset`` is the left-out part of the split.
    """
    splitter = LeaveOneOut(n_splits=1)
    for loo_train, loo_test in splitter.split(ratings_dataset):
        algo.fit(loo_train)
        # Predict on the anti test-set built from the training part
        candidate_predictions = algo.test(loo_train.build_anti_testset())

        # Group the (item, estimate) pairs by user
        per_user = {}
        for uid, iid, _, est, _ in candidate_predictions:
            per_user.setdefault(uid, []).append((iid, est))

        # Keep only the best-scored items of every user
        ranked = {
            uid: sorted(pairs, key=lambda pair: pair[1], reverse=True)[:eval_config.top_n_value]
            for uid, pairs in per_user.items()
        }
        # Only one split was requested, so the first one is the answer
        return ranked, loo_test
 def generate_full_top_n(algo, ratings_dataset, eval_config):
    """Build per-user top-n recommendations after training on the full dataset.

    ``algo`` is fitted on the full trainset of ``ratings_dataset`` and then
    asked to predict the anti test-set built from that trainset. For each user
    the ``eval_config.top_n_value`` highest-estimated items are kept.

    Returns a dictionary mapping each user id to a list of
    ``(item id, estimate)`` pairs sorted by decreasing estimate.
    """
    everything = ratings_dataset.build_full_trainset()
    algo.fit(everything)
    # Predict on the anti test-set built from the full trainset
    candidate_predictions = algo.test(everything.build_anti_testset())

    # Group the (item, estimate) pairs by user
    per_user = {}
    for uid, iid, _, est, _ in candidate_predictions:
        per_user.setdefault(uid, []).append((iid, est))

    # Keep only the best-scored items of every user
    return {
        uid: sorted(pairs, key=lambda pair: pair[1], reverse=True)[:eval_config.top_n_value]
        for uid, pairs in per_user.items()
    }
 def precomputed_information(movie_data):
    """Precompute the information needed by the metrics evaluated in full mode.

    ``movie_data`` must have a ``movieId`` column; the number of rows per
    ``movieId`` is used as the popularity of a movie.

    Dictionary keys:
    - precomputed_dict["item_to_rank"] : dictionary mapping each movie id to its
      popularity rank (1 = movie with the most rows)
    - (-- for your project, add other relevant information here -- )
    """
    # Number of rows per movie, most frequent movie first
    popularity = movie_data.groupby('movieId').size().sort_values(ascending=False)
    # The position in that ordering, counted from 1, is the rank of the movie
    item_to_rank = {
        movie_id: rank
        for rank, movie_id in enumerate(popularity.index, start=1)
    }
    return {"item_to_rank": item_to_rank}
 def create_evaluation_report(eval_config, sp_ratings, precomputed_dict, available_metrics):
    """Evaluate every model of ``eval_config`` and gather the scores in a DataFrame.

    Each entry of ``eval_config.models`` is a ``(name, model class, kwargs)``
    triple. A model is instantiated once and scored in up to three modes
    (split, loo, full); a mode is skipped when its metric list in
    ``eval_config`` is empty. ``available_metrics`` maps a mode to a dictionary
    ``metric name -> (evaluation function, extra keyword arguments)``.

    Returns a DataFrame with one row per model and one column per metric.
    """
    report_rows = {}
    for model_name, model, arguments in eval_config.models:
        print(f'Handling model {model_name}')
        algo = model(**arguments)
        # ``scores`` is the very dictionary stored in the report for this model
        scores = report_rows[model_name] = {}

        # Mode 1: metrics computed on the predictions of a random split
        if len(eval_config.split_metrics) > 0:
            print('Training split predictions')
            split_predictions = generate_split_predictions(algo, sp_ratings, eval_config)
            for metric in eval_config.split_metrics:
                print(f'- computing metric {metric}')
                assert metric in available_metrics['split']
                metric_fn, metric_kwargs = available_metrics["split"][metric]
                scores[metric] = metric_fn(split_predictions, **metric_kwargs)

        # Mode 2: metrics computed on the top-n of a leave-one-out split
        if len(eval_config.loo_metrics) > 0:
            print('Training loo predictions')
            loo_top_n, loo_testset = generate_loo_top_n(algo, sp_ratings, eval_config)
            for metric in eval_config.loo_metrics:
                assert metric in available_metrics['loo']
                metric_fn, metric_kwargs = available_metrics["loo"][metric]
                scores[metric] = metric_fn(loo_top_n, loo_testset, **metric_kwargs)

        # Mode 3: metrics computed on the top-n of a model trained on all ratings
        if len(eval_config.full_metrics) > 0:
            print('Training full predictions')
            full_top_n = generate_full_top_n(algo, sp_ratings, eval_config)
            for metric in eval_config.full_metrics:
                assert metric in available_metrics['full']
                metric_fn, metric_kwargs = available_metrics["full"][metric]
                # Full metrics also receive the precomputed information as keywords
                scores[metric] = metric_fn(full_top_n, **precomputed_dict, **metric_kwargs)

    # Models come out as columns of from_dict; transpose to get one row per model
    report = pd.DataFrame.from_dict(report_rows)
    return report.T
 ```
 %% Cell type:markdown id:f7e83d1d tags:
 # 2. Evaluation metrics
 Implement evaluation metrics for either rating predictions (split metrics) or top-n recommendations (LOO metrics, full metrics).
 %% Cell type:code id:f1849e55 tags:
 ``` python
 # -- implement the function get_hit_rate --
 def get_hit_rate(anti_testset_top_n, testset):
    """Compute the average hit over the users (loo metric).

    A hit (1) happens when the left-out movie of a testset entry is among the
    top-n recommendations of the same user; otherwise the entry is a fail (0).

    Args:
        anti_testset_top_n: mapping user id -> list of (item id, estimate) pairs.
        testset: sequence of (user id, item id, rating) triples.

    Returns:
        Number of hits divided by the number of testset entries, or 0.0 when
        the testset is empty (same zero-division guard as get_novelty).
    """
    total_users = len(testset)
    if total_users == 0:
        return 0.0  # nothing to evaluate; avoid division by zero

    hits = 0
    for uid, true_iid, _ in testset:
        # A user without any recommendation can never produce a hit
        if uid not in anti_testset_top_n:
            continue
        recommended_iids = {iid for iid, _ in anti_testset_top_n[uid]}
        if true_iid in recommended_iids:
            hits += 1
    return hits / total_users
 # -- implement the function get_novelty --
 def get_novelty(anti_testset_top_n, item_to_rank):
    """Compute the average novelty of the top-n recommendations (full metric).

    The novelty is the mean of ``item_to_rank`` over every recommended item of
    every user. Recommended items missing from ``item_to_rank`` are ignored.
    Returns 0 when no recommended item has a rank.
    """
    rank_total = 0
    ranked_count = 0
    for recommendations in anti_testset_top_n.values():
        for iid, _ in recommendations:
            # Items without a known rank do not contribute to the average
            if iid not in item_to_rank:
                continue
            rank_total += item_to_rank[iid]
            ranked_count += 1

    # Guard against a division by zero when nothing could be ranked
    if ranked_count == 0:
        return 0
    return rank_total / ranked_count
 ```
 %% Cell type:markdown id:1a9855b3 tags:
 # 3. Evaluation workflow
 Load data, evaluate models and save the experimental outcomes
 %% Cell type:code id:704f4d2a tags:
 ``` python
 # Registry of the metrics known to the evaluator, grouped by evaluation mode.
 # Every entry maps a metric name to (evaluation function, extra keyword arguments).
 AVAILABLE_METRICS = {
    "split": {
        "mae": (accuracy.mae, {"verbose": False}),
        "rmse": (accuracy.rmse, {"verbose": False}),
    },
    "loo": {"hit_rate": (get_hit_rate, {})},
    "full": {"novelty": (get_novelty, {})},
 }

 # Ratings loaded with surprise_format=True, as passed to the evaluation functions
 sp_ratings = load_ratings(surprise_format=True)
 # Precomputed information forwarded as keyword arguments to the "full" metrics
 precomputed_dict = precomputed_information(
    pd.read_csv("data/tiny/evidence/ratings.csv")
 )
 # Score every configured model, then persist the resulting report
 evaluation_report = create_evaluation_report(
    EvalConfig, sp_ratings, precomputed_dict, AVAILABLE_METRICS
 )
 export_evaluation_report(evaluation_report)
 ```
 %% Output
    Handling model baseline_1
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model baseline_2
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model baseline_3
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model baseline_4
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model ContentBased_sample
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model ContentBased_score
    Training split predictions
    - computing metric mae
    - computing metric rmse
    Training loo predictions
    Training full predictions
    Handling model ContentBased_Lr
    Training split predictions
+    - computing metric mae
+    - computing metric rmse
+    Training loo predictions
+    Training full predictions
+    The data has been exported to the evaluation report
-    ---------------------------------------------------------------------------
+                              mae      rmse  hit_rate     novelty
-    KeyError                                  Traceback (most recent call last)
+    baseline_1           1.561178  1.792482  0.074766   99.405607
-File     /Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/surprise/trainset.py:180, in Trainset.to_raw_iid(self, iiid)
+    baseline_2           1.471412  1.819364  0.000000  429.942991
-        179 try:
+    baseline_3           0.878270  1.085591  0.074766   99.405607
-    --> 180     return self._inner2raw_id_items[iiid]
+    baseline_4           0.705673  0.912313  0.130841   60.202804
-        181 except KeyError:
+    ContentBased_sample  1.013747  1.350417  0.084112  178.048598
-    KeyError: 1210
+    ContentBased_score   1.461846  1.803067  0.018692  437.222430
+    ContentBased_Lr      1.202626  1.460273  0.084112  278.046729
-During handling of the above exception, another exception occurred:
-    ValueError                                Traceback (most recent call last)
-Cell     In[64], line 16
-         14 sp_ratings = load_ratings(surprise_format=True)
-         15 precomputed_dict = precomputed_information(pd.read_csv("data/tiny/evidence/ratings.csv"))
-    ---> 16 evaluation_report = create_evaluation_report(EvalConfig, sp_ratings, precomputed_dict, AVAILABLE_METRICS)
-         17 export_evaluation_report(evaluation_report)
-Cell     In[62], line 95, in create_evaluation_report(eval_config, sp_ratings, precomputed_dict, available_metrics)
-         93 if len(eval_config.split_metrics) > 0:
-         94     print('Training split predictions')
-    ---> 95     predictions = generate_split_predictions(algo, sp_ratings, eval_config)
-         96     for metric in eval_config.split_metrics:
-         97         print(f'- computing metric {metric}')
-Cell     In[62], line 9, in generate_split_predictions(algo, ratings_dataset, eval_config)
-          6 trainset, testset = train_test_split(ratings_dataset, test_size=eval_config.test_size)
-          8 # Training the algorithm on the train data set
-    ----> 9 algo.fit(trainset)
-         11 # Predict ratings for the testset
-         12 predictions = algo.test(testset)
-File     ~/vscodeworkspace/recomsys/models.py:130, in ContentBased.fit(self, trainset)
-        126 user_ratings = [(self.trainset.to_raw_iid(i), rating) for (i, rating) in self.trainset.ur[u]]
-        128 df_user = pd.DataFrame(user_ratings, columns = ["item_id", "user_ratings"])
-    --> 130 df_user["item_id"] = df_user["item_id"].map(trainset.to_raw_iid)
-        132 df_user = df_user.merge(self.content_features, left_on = "item_id", right_index = True, how = 'left')
-        134 X = df_user['n_character_title'].values.reshape(-1,1)
-File     /Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/series.py:4544, in Series.map(self, arg, na_action)
-       4464 def map(
-       4465     self,
-       4466     arg: Callable | Mapping | Series,
-       4467     na_action: Literal["ignore"] | None = None,
-       4468 ) -> Series:
-       4469     """
-       4470     Map values of Series according to an input mapping or function.
-       4471
-       (...)
-       4542     dtype: object
-       4543     """
-    -> 4544     new_values = self._map_values(arg, na_action=na_action)
-       4545     return self._constructor(new_values, index=self.index, copy=False).__finalize__(
-       4546         self, method="map"
-       4547     )
-File     /Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/base.py:921, in IndexOpsMixin._map_values(self, mapper, na_action, convert)
-        918 if isinstance(arr, ExtensionArray):
-        919     return arr.map(mapper, na_action=na_action)
-    --> 921 return algorithms.map_array(arr, mapper, na_action=na_action, convert=convert)
-File     /Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/pandas/core/algorithms.py:1814, in map_array(arr, mapper, na_action, convert)
-       1812 values = arr.astype(object, copy=False)
-       1813 if na_action is None:
-    -> 1814     return lib.map_infer(values, mapper, convert=convert)
-       1815 else:
-       1816     return lib.map_infer_mask(
-       1817         values, mapper, mask=isna(values).view(np.uint8), convert=convert
-       1818     )
-File     lib.pyx:2926, in pandas._libs.lib.map_infer()
-File     /Library/Frameworks/Python.framework/Versions/3.12/lib/python3.12/site-packages/surprise/trainset.py:182, in Trainset.to_raw_iid(self, iiid)
-        180     return self._inner2raw_id_items[iiid]
-        181 except KeyError:
-    --> 182     raise ValueError(str(iiid) + " is not a valid inner id.")
-    ValueError: 1210 is not a valid inner id.
 %% Cell type:markdown id:6f8b6d19 tags:
 **TODO:** state which model performs best, based on the evaluation report above.