sequential-parameter-optimization
diff --git a/‎notebooks/00_spot_doc.ipynb‎
Lines changed: 258 additions & 0 deletions b/‎notebooks/00_spot_doc.ipynb‎
Lines changed: 258 additions & 0 deletions
@@ -884,6 +884,264 @@
     "\n",
     "# root.mainloop()"
    ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def apk(actual, predicted, k=10):\n",
+    "    \"\"\"\n",
+    "    Computes the average precision at k.\n",
+    "    This function computes the average precision at k between two lists of\n",
+    "    items.\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    actual : list or array-like\n",
+    "             The elements that are to be predicted (order doesn't matter)\n",
+    "    predicted : list or array-like\n",
+    "                The predicted elements (order does matter)\n",
+    "    k : int, optional\n",
+    "        The maximum number of predicted elements\n",
+    "    Returns\n",
+    "    -------\n",
+    "    score : float\n",
+    "            The average precision at k over the input lists;\n",
+    "            0.0 when `actual` is empty\n",
+    "    \"\"\"\n",
+    "    # Test emptiness by length, not by truthiness: `not actual` on a\n",
+    "    # one-element numpy array evaluates the element itself, so a single\n",
+    "    # relevant item equal to 0 would be mistaken for 'nothing to predict'.\n",
+    "    if len(actual) == 0:\n",
+    "        return 0.0\n",
+    "\n",
+    "    if len(predicted) > k:\n",
+    "        predicted = predicted[:k]\n",
+    "\n",
+    "    score = 0.0\n",
+    "    num_hits = 0.0\n",
+    "\n",
+    "    for i, p in enumerate(predicted):\n",
+    "        # A repeated prediction is only credited at its first occurrence.\n",
+    "        if p in actual and p not in predicted[:i]:\n",
+    "            num_hits += 1.0\n",
+    "            # Precision at this rank: hits so far / predictions so far.\n",
+    "            score += num_hits / (i + 1.0)\n",
+    "\n",
+    "    # Normalise by the largest number of hits achievable within k.\n",
+    "    return score / min(len(actual), k)\n",
+    "\n",
+    "\n",
+    "def mapk(actual, predicted, k=10):\n",
+    "    \"\"\"\n",
+    "    Mean average precision at k over a batch of queries.\n",
+    "    Each entry of `actual` is paired with the entry of `predicted` at the\n",
+    "    same position, the pair is scored with `apk`, and the scores are\n",
+    "    averaged. Pairing uses `zip`, so surplus entries of the longer input\n",
+    "    are ignored.\n",
+    "    Parameters\n",
+    "    ----------\n",
+    "    actual : list\n",
+    "             One list of relevant elements per query\n",
+    "             (order inside each list is irrelevant)\n",
+    "    predicted : list\n",
+    "                One ranked list of predicted elements per query\n",
+    "                (order inside each list is significant)\n",
+    "    k : int, optional\n",
+    "        The maximum number of predicted elements considered per query\n",
+    "    Returns\n",
+    "    -------\n",
+    "    score : double\n",
+    "            The mean of the per-query average precision at k\n",
+    "    \"\"\"\n",
+    "    per_query_scores = []\n",
+    "    for relevant, ranked in zip(actual, predicted):\n",
+    "        per_query_scores.append(apk(relevant, ranked, k))\n",
+    "    return np.mean(per_query_scores)\n",
+    "\n",
+    "\n",
+    "def mapk_score(y_true, y_pred, k=3):\n",
+    "    \"\"\"Wrapper for mapk func using numpy arrays.\n",
+    "\n",
+    "    Ranks the classes of every sample by descending score, keeps the k\n",
+    "    best-ranked class indices and scores them against the single true\n",
+    "    label of that sample.\n",
+    "\n",
+    "    Args:\n",
+    "        y_true (np.array): true class indices, one per sample\n",
+    "        y_pred (np.array): class scores, one row per sample and one\n",
+    "            column per class\n",
+    "        k (int): number of top-ranked classes kept per sample\n",
+    "    Returns:\n",
+    "        score (float): mean average precision at k\n",
+    "    Examples:\n",
+    "        >>> y_true = np.array([0, 1, 2, 2])\n",
+    "        >>> y_pred = np.array([[0.5, 0.2, 0.2],  # class 0 is ranked 1st\n",
+    "        ...                    [0.3, 0.4, 0.2],  # class 1 is ranked 1st\n",
+    "        ...                    [0.2, 0.4, 0.3],  # class 2 is ranked 2nd\n",
+    "        ...                    [0.7, 0.2, 0.1]]) # class 2 is ranked 3rd\n",
+    "        >>> float(mapk_score(y_true, y_pred, k=1))\n",
+    "        0.5\n",
+    "        >>> float(mapk_score(y_true, y_pred, k=2))\n",
+    "        0.625\n",
+    "        >>> round(float(mapk_score(y_true, y_pred, k=3)), 4)\n",
+    "        0.7083\n",
+    "        >>> round(float(mapk_score(y_true, y_pred, k=5)), 4)\n",
+    "        0.7083\n",
+    "    \"\"\"\n",
+    "    # Accept plain sequences as well as arrays.\n",
+    "    y_true = np.asarray(y_true)\n",
+    "    y_pred = np.asarray(y_pred)\n",
+    "    # Stable sort so that tied scores keep ascending class order.\n",
+    "    sorted_prediction_ids = np.argsort(-y_pred, axis=1, kind='stable')\n",
+    "    top_k_prediction_ids = sorted_prediction_ids[:, :k]\n",
+    "    # Pass plain Python lists: a one-element list stays truthy even when\n",
+    "    # the label is 0, whereas a one-element numpy array holding 0 is falsy.\n",
+    "    score = mapk(\n",
+    "        y_true.reshape(-1, 1).tolist(),\n",
+    "        top_k_prediction_ids.tolist(),\n",
+    "        k=k,\n",
+    "    )\n",
+    "    return score"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "0.75"
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import numpy as np\n",
+    "# from spotPython.utils.metrics import mapk_score\n",
+    "from sklearn.metrics import top_k_accuracy_score\n",
+    "\n",
+    "y_true = np.array([0, 1, 2, 2])\n",
+    "y_pred = np.array([[0.5, 0.2, 0.2],  # 0 is in top 2\n",
+    "            [0.3, 0.4, 0.2],  # 1 is in top 2\n",
+    "            [0.2, 0.4, 0.3],  # 2 is in top 2\n",
+    "            [0.7, 0.2, 0.1]]) # 2 isn't in top 2\n",
+    "top_k_accuracy_score(y_true, y_pred, k=2)\n",
+    "#mapk_score(y_true, y_pred, k=2)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "0.4583333333333333"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "mapk_score(y_true, y_pred, k=5)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(4,)"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "y_true.shape"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "numpy.ndarray"
+      ]
+     },
+     "execution_count": 12,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "type(y_true)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "array([[0],\n",
+       "       [1],\n",
+       "       [2],\n",
+       "       [2]])"
+      ]
+     },
+     "execution_count": 13,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "y_true.reshape(-1, 1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "array([0, 1, 2, 2])"
+      ]
+     },
+     "execution_count": 15,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "y_true"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "array([[0, 1, 2],\n",
+       "       [1, 0, 2],\n",
+       "       [1, 2, 0],\n",
+       "       [0, 1, 2]])"
+      ]
+     },
+     "execution_count": 18,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "np.argsort(-y_pred, axis=1)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
   }
  ],
  "metadata": {