{
"cells": [
{
"cell_type": "code",
"execution_count": 13,
"id": "3f8c6593-fa93-44c3-bbc2-7191da00ed1f",
"metadata": {},
"outputs": [],
"source": [
"import numpy as np\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"%matplotlib inline"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "cf716145-8bf5-41d5-a8dc-ecad0802ed28",
"metadata": {},
"outputs": [],
"source": [
"# header=None tells pandas the file has no header row; the four column\n",
"# names are attached right after loading.\n",
"labels_df = pd.read_csv(\"train.csv\", header=None).set_axis(\n",
"    [\"path1\", \"path2\", \"path3\", \"is_collected\"], axis=1\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "82b36668-d24c-42fb-a956-6db50cf93c5f",
"metadata": {},
"outputs": [],
"source": [
"# Turn every is_collected flag into the string label \"True\" or \"False\".\n",
"# The column is cast to bool first so the mapping follows element truthiness,\n",
"# exactly like the previous per-row `if` test, but in one vectorized pass.\n",
"# np.where always yields a string array, even when the column is empty, so the\n",
"# string comparisons in the cells below stay well-defined.\n",
"items = np.where(labels_df[\"is_collected\"].to_numpy(dtype=bool), \"True\", \"False\")"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "1401cdb8-6fec-4635-b1f4-dd96becd81eb",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAYQAAAD4CAYAAADsKpHdAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjMuNCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8QVMy6AAAACXBIWXMAAAsTAAALEwEAmpwYAAARpElEQVR4nO3df6xf9X3f8ecrdkq9ZTB+XJhlWzUqrhRAihMszxLalsxV8Zo/TCTQLuuKJ1lyhRyp1bJJUEVq9oenoC1BQhpojkAYlAVc0hRvDWuRyRR18iA3kRdjCM1VocG1h28LozANFjvv/XHfV/r6+uv7077XMc+HdPQ93/f5fM75HP/xfd3zOef7daoKSZI+stwDkCRdHAwESRJgIEiSmoEgSQIMBElSW7ncA1ioa665ptavX7/cw5Cknyvf//73/6qqRoZt+7kNhPXr1zM2Nrbcw5CknytJ/uJc25wykiQBBoIkqRkIkiTAQJAktVkDIckvJnkxyf9McjTJv+n6VUmeS/Ljfr1yoM99ScaTvJrktoH6LUmO9LYHk6TrlyV5qusvJFl/Ac5VkjSDuVwhfAD846r6BLAR2JZkC3AvcLCqNgAH+z1JbgRGgZuAbcBDSVb0vh4GdgEbetnW9Z3A21V1A/AAcP/iT02SNB+zBkJNeq/ffrSXArYD+7q+D7i917cDT1bVB1X1GjAObE6yGri8qg7V5E+sPj6tz9S+nga2Tl09SJKWxpzuISRZkeQwcBJ4rqpeAK6rqhMA/XptN18DvDHQ/VjX1vT69PoZfarqFPAOcPWQcexKMpZkbGJiYk4nKEmamzkFQlWdrqqNwFom/9q/eYbmw/6yrxnqM/WZPo69VbWpqjaNjAz9op0kaYHm9U3lqvrfSf4bk3P/byZZXVUnejroZDc7Bqwb6LYWON71tUPqg32OJVkJXAG8Nc9zmbP19/7Rhdr1rF7/8meX7diSNJO5PGU0kuTv9voq4FeBHwEHgB3dbAfwTK8fAEb7yaHrmbx5/GJPK72bZEvfH7h7Wp+pfd0BPF/+V26StKTmcoWwGtjXTwp9BNhfVf8lySFgf5KdwE+AOwGq6miS/cDLwClgd1Wd7n3dAzwGrAKe7QXgEeCJJONMXhmMno+TkyTN3ayBUFU/BD45pP7XwNZz9NkD7BlSHwPOuv9QVe/TgSJJWh5+U1mSBBgIkqRmIEiSAANBktQMBEkSYCBIkpqBIEkCDARJUjMQJEmAgSBJagaCJAkwECRJzUCQJAEGgiSpGQiSJMBAkCQ1A0GSBBgIkqRmIEiSAANBktQMBEkSYCBIkpqBIEkCDARJUjMQJEmAgSBJarMGQpJ1Sb6T5JUkR5P8dte/lOQvkxzu5dcH+tyXZDzJq0luG6jfkuRIb3swSbp+WZKnuv5CkvUX4FwlSTOYyxXCKeALVfVxYAuwO8mNve2BqtrYy7cBetsocBOwDXgoyYpu/zCwC9jQy7au7wTerqobgAeA+xd/apKk+Zg1EKrqRFX9oNffBV4B1szQZTvwZFV9UFWvAePA5iSrgcur6lBVFfA4cPtAn329/jSwderqQZK0NOZ1D6Gncj4JvNClzyf5YZJHk1zZtTXAGwPdjnVtTa9Pr5/Rp6pOAe8AVw85/q4kY0nGJiYm5jN0SdIs5hwIST4GfBP4nar6Gyanf34Z2AicAL4y1XRI95qhPlOfMwtVe6tqU1VtGhkZmevQJUlzMKdASPJRJsPg61X1BwBV9WZVna6qnwFfAzZ382PAuoHua4HjXV87pH5GnyQrgSuAtxZyQpKkhZnLU0YBHgFeqaqvDtRXDzT7HPBSrx8ARvvJoeuZvHn8YlWdAN5NsqX3eTfwzECfHb1+B/B832eQJC2RlXNocyvwm8CRJIe79rvAXUk2Mjm18zrwWwBVdTTJfuBlJp9Q2l1Vp7vfPcBjwCrg2V5gMnCeSDLO5JXB6GJOSpI0f7MGQlX9KcPn+L89Q589wJ
4h9THg5iH194E7ZxuLJOnC8ZvKkiTAQJAkNQNBkgQYCJKkZiBIkgADQZLUDARJEmAgSJKagSBJAgwESVIzECRJgIEgSWoGgiQJMBAkSc1AkCQBBoIkqRkIkiTAQJAkNQNBkgQYCJKkZiBIkgADQZLUDARJEmAgSJKagSBJAgwESVKbNRCSrEvynSSvJDma5Le7flWS55L8uF+vHOhzX5LxJK8muW2gfkuSI73twSTp+mVJnur6C0nWX4BzlSTNYC5XCKeAL1TVx4EtwO4kNwL3AgeragNwsN/T20aBm4BtwENJVvS+HgZ2ARt62db1ncDbVXUD8ABw/3k4N0nSPMwaCFV1oqp+0OvvAq8Aa4DtwL5utg+4vde3A09W1QdV9RowDmxOshq4vKoOVVUBj0/rM7Wvp4GtU1cPkqSlMa97CD2V80ngBeC6qjoBk6EBXNvN1gBvDHQ71rU1vT69fkafqjoFvANcPeT4u5KMJRmbmJiYz9AlSbOYcyAk+RjwTeB3qupvZmo6pFYz1Gfqc2aham9VbaqqTSMjI7MNWZI0D3MKhCQfZTIMvl5Vf9DlN3saiH492fVjwLqB7muB411fO6R+Rp8kK4ErgLfmezKSpIWby1NGAR4BXqmqrw5sOgDs6PUdwDMD9dF+cuh6Jm8ev9jTSu8m2dL7vHtan6l93QE83/cZJElLZOUc2twK/CZwJMnhrv0u8GVgf5KdwE+AOwGq6miS/cDLTD6htLuqTne/e4DHgFXAs73AZOA8kWScySuD0cWdliRpvmYNhKr6U4bP8QNsPUefPcCeIfUx4OYh9ffpQJEkLQ+/qSxJAgwESVIzECRJgIEgSWoGgiQJMBAkSc1AkCQBBoIkqRkIkiTAQJAkNQNBkgQYCJKkZiBIkgADQZLUDARJEmAgSJKagSBJAgwESVIzECRJgIEgSWoGgiQJMBAkSc1AkCQBBoIkqRkIkiRgDoGQ5NEkJ5O8NFD7UpK/THK4l18f2HZfkvEkrya5baB+S5Ijve3BJOn6ZUme6voLSdaf53OUJM3BXK4QHgO2Dak/UFUbe/k2QJIbgVHgpu7zUJIV3f5hYBewoZepfe4E3q6qG4AHgPsXeC6SpEWYNRCq6rvAW3Pc33bgyar6oKpeA8aBzUlWA5dX1aGqKuBx4PaBPvt6/Wlg69TVgyRp6SzmHsLnk/ywp5Su7Noa4I2BNse6tqbXp9fP6FNVp4B3gKsXMS5J0gIsNBAeBn4Z2AicAL7S9WF/2dcM9Zn6nCXJriRjScYmJibmNWBJ0swWFAhV9WZVna6qnwFfAzb3pmPAuoGma4HjXV87pH5GnyQrgSs4xxRVVe2tqk1VtWlkZGQhQ5ckncOCAqHvCUz5HDD1BNIBYLSfHLqeyZvHL1bVCeDdJFv6/sDdwDMDfXb0+h3A832fQZK0hFbO1iDJN4BPA9ckOQb8HvDpJBuZnNp5HfgtgKo6mmQ/8DJwCthdVad7V/cw+cTSKuDZXgAeAZ5IMs7klcHoeTgvSdI8zRoIVXXXkPIjM7TfA+wZUh8Dbh5Sfx+4c7ZxSJIuLL+pLEkCDARJUjMQJEmAgSBJagaCJAkwECRJzUCQJAEGgiSpGQiSJMBAkCQ1A0GSBBgIkqRmIEiSAANBktQMBEkSYCBIkpqBIEkCDARJUjMQJEmAgSBJagaCJAkwECRJzUCQJAEGgiSpGQiSJMBAkCS1WQMhyaNJTiZ5aaB2VZLnkvy4X68c2HZfkvEkrya5baB+S5Ijve3BJOn6ZUme6voLSdaf53OUJM3BXK4QHgO2TavdCxysqg3AwX5PkhuBUeCm7vNQkhXd52FgF7Chl6l97gTerqobgAeA+xd6MpKkhZs1EKrqu8Bb08rbgX29vg+4faD+ZFV9UFWvAePA5iSrgcur6lBVFfD4tD5T+3oa2Dp19SBJWjoLvYdwXVWdAOjXa7u+BnhjoN2xrq3p9en1M/pU1SngHeDqYQdNsivJWJKxiYmJBQ
5dkjTM+b6pPOwv+5qhPlOfs4tVe6tqU1VtGhkZWeAQJUnDLDQQ3uxpIPr1ZNePAesG2q0Fjnd97ZD6GX2SrASu4OwpKknSBbbQQDgA7Oj1HcAzA/XRfnLoeiZvHr/Y00rvJtnS9wfuntZnal93AM/3fQZJ0hJaOVuDJN8APg1ck+QY8HvAl4H9SXYCPwHuBKiqo0n2Ay8Dp4DdVXW6d3UPk08srQKe7QXgEeCJJONMXhmMnpczkyTNy6yBUFV3nWPT1nO03wPsGVIfA24eUn+fDhRJ0vLxm8qSJMBAkCQ1A0GSBBgIkqRmIEiSAANBktQMBEkSYCBIkpqBIEkCDARJUjMQJEmAgSBJagaCJAkwECRJzUCQJAEGgiSpGQiSJMBAkCQ1A0GSBBgIkqRmIEiSAANBktQMBEkSYCBIkpqBIEkCDARJUltUICR5PcmRJIeTjHXtqiTPJflxv1450P6+JONJXk1y20D9lt7PeJIHk2Qx45Ikzd/5uEL4TFVtrKpN/f5e4GBVbQAO9nuS3AiMAjcB24CHkqzoPg8Du4ANvWw7D+OSJM3DhZgy2g7s6/V9wO0D9Ser6oOqeg0YBzYnWQ1cXlWHqqqAxwf6SJKWyGIDoYA/SfL9JLu6dl1VnQDo12u7vgZ4Y6Dvsa6t6fXp9bMk2ZVkLMnYxMTEIocuSRq0cpH9b62q40muBZ5L8qMZ2g67L1Az1M8uVu0F9gJs2rRpaBtJ0sIs6gqhqo7360ngW8Bm4M2eBqJfT3bzY8C6ge5rgeNdXzukLklaQgsOhCR/O8nfmVoHfg14CTgA7OhmO4Bnev0AMJrksiTXM3nz+MWeVno3yZZ+uujugT6SpCWymCmj64Bv9ROiK4H/VFX/Ncn3gP1JdgI/Ae4EqKqjSfYDLwOngN1Vdbr3dQ/wGLAKeLYXSdISWnAgVNWfA58YUv9rYOs5+uwB9gypjwE3L3QskqTF85vKkiTAQJAkNQNBkgQYCJKkZiBIkgADQZLUDARJEmAgSJKagSBJAgwESVIzECRJwOL/PwRJ+lBaf+8fLduxX//yZy/Ifr1CkCQBBoIkqRkIkiTAQJAkNQNBkgQYCJKkZiBIkgADQZLUDARJEmAgSJKagSBJAgwESVIzECRJgIEgSWoXTSAk2Zbk1STjSe5d7vFI0ofNRREISVYA/wH4J8CNwF1JblzeUUnSh8tFEQjAZmC8qv68qv4f8CSwfZnHJEkfKhfL/5i2Bnhj4P0x4O9Pb5RkF7Cr376X5NUFHu8a4K8W2HdRcv9yHFXSpST3L+oz7JfOteFiCYQMqdVZhaq9wN5FHywZq6pNi92PJC2HC/UZdrFMGR0D1g28XwscX6axSNKH0sUSCN8DNiS5PskvAKPAgWUekyR9qFwUU0ZVdSrJ54E/BlYAj1bV0Qt4yEVPO0nSMrogn2GpOmuqXpL0IXSxTBlJkpaZgSBJAi6SewjnQ5LTwJGB0u1V9fo52r5XVR9bkoFJ0hwkuRo42G//HnAamOj3m/tLuxd2DJfKPYT5fMgbCJIuZkm+BLxXVf9+oLayqk5dyONeslNGST6W5GCSHyQ5kuSsn8JIsjrJd5McTvJSkn/Q9V9Lcqj7/n4Sw0PSkkvyWJKvJvkOcH+SLyX5VwPbX0qyvtf/eZIX+/PsP/ZvxM3LpRQIq/of4nCSbwHvA5+rqk8BnwG+kmT6N6L/GfDHVbUR+ARwOMk1wBeBX+2+Y8C/XLKzkKQz/QqTn0dfOFeDJB8H/ilwa3+enQZ+Y74HumTuIQD/t/8hAEjyUeDfJvmHwM+Y/L2k64D/NdDne8Cj3fYPq+pwkn/E5C+u/vfOj18ADi3NKUjSWX6/qk7P0mYrcAvwvf7cWgWcnO+BLqVAmO43gBHglqr6aZLXgV8cbFBV3+3A+CzwRJJ/B7wNPFdVdy31gCVpiP8zsH6KM2d2pj7TAuyrqvsWc6BLacpouiuAkx0Gn2HIL/wl+aVu8zXgEeBTwP8Abk1yQ7
f5W0l+ZQnHLUnn8jqTn1Mk+RRwfdcPAnckuba3XdWfb/NyKV8hfB34z0nGgMPAj4a0+TTwr5P8FHgPuLuqJpL8C+AbSS7rdl8E/uyCj1iSZvZN4O4kh5mc8v4zgKp6OckXgT9J8hHgp8Bu4C/ms/NL5rFTSdLiXMpTRpKkeTAQJEmAgSBJagaCJAkwECRJzUCQJAEGgiSp/X+HnPkIxXtoiwAAAABJRU5ErkJggg==\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"# Histogram of the \"True\"/\"False\" labels, drawn on an explicit Axes\n",
"# instead of going through the implicit pyplot current-axes state.\n",
"fig, ax = plt.subplots()\n",
"ax.hist(items)\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "bca04b79-e9e7-4e45-965c-f94a6cd1cf2b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"2577"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Number of entries in `items` equal to the label \"True\".\n",
"int(np.sum(items == \"True\"))"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "4405f10a-9c73-4d5c-b530-7e01870f2a6c",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"29796"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Number of entries in `items` equal to the label \"False\".\n",
"int(np.sum(items == \"False\"))"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.8"
}
},
"nbformat": 4,
"nbformat_minor": 5
}