{ "cells": [ { "cell_type": "markdown", "metadata": { "id": "view-in-github" }, "source": [ "\"Open" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "gsPQAdhlisSg", "outputId": "1b022646-7fc1-4edc-e13f-69ba28487287" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Mounted at /content/drive/\n" ] } ], "source": [ "import numpy as np \n", "import pandas as pd \n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "from imblearn.over_sampling import BorderlineSMOTE\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.ensemble import RandomForestClassifier\n", "from sklearn.metrics import precision_score, recall_score, f1_score, confusion_matrix\n", "from sklearn.linear_model import LogisticRegression\n", "from google.colab import drive\n", "\n", "drive.mount('/content/drive/', force_remount=True)\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "tY6Vxi8X-Fwf", "outputId": "74156519-99a6-49c4-f9bd-1a491609f9c0" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "creditcard.csv\n" ] } ], "source": [ "!ls \"/content/drive/MyDrive/Credit_Card\"" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "wir7KI3um4pQ" }, "outputs": [], "source": [ "data = pd.read_csv(\"/content/drive/MyDrive/Credit_Card/creditcard.csv\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "C5Ok114Xosaf", "outputId": "247f6c50-fc2b-4592-820e-71a473c0459e" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ " Time V1 V2 V3 V4 V5 V6 V7 \\\n", "0 0.0 -1.359807 -0.072781 2.536347 1.378155 -0.338321 0.462388 0.239599 \n", "1 0.0 1.191857 0.266151 0.166480 0.448154 0.060018 -0.082361 -0.078803 \n", "2 1.0 -1.358354 -1.340163 1.773209 0.379780 -0.503198 
1.800499 0.791461 \n", "3 1.0 -0.966272 -0.185226 1.792993 -0.863291 -0.010309 1.247203 0.237609 \n", "4 2.0 -1.158233 0.877737 1.548718 0.403034 -0.407193 0.095921 0.592941 \n", "\n", " V8 V9 ... V21 V22 V23 V24 V25 \\\n", "0 0.098698 0.363787 ... -0.018307 0.277838 -0.110474 0.066928 0.128539 \n", "1 0.085102 -0.255425 ... -0.225775 -0.638672 0.101288 -0.339846 0.167170 \n", "2 0.247676 -1.514654 ... 0.247998 0.771679 0.909412 -0.689281 -0.327642 \n", "3 0.377436 -1.387024 ... -0.108300 0.005274 -0.190321 -1.175575 0.647376 \n", "4 -0.270533 0.817739 ... -0.009431 0.798278 -0.137458 0.141267 -0.206010 \n", "\n", " V26 V27 V28 Amount Class \n", "0 -0.189115 0.133558 -0.021053 149.62 0 \n", "1 0.125895 -0.008983 0.014724 2.69 0 \n", "2 -0.139097 -0.055353 -0.059752 378.66 0 \n", "3 -0.221929 0.062723 0.061458 123.50 0 \n", "4 0.502292 0.219422 0.215153 69.99 0 \n", "\n", "[5 rows x 31 columns] \n", "\n", "\n", "\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "(284807, 31)" ] }, "metadata": {}, "execution_count": 93 } ], "source": [ "print(data.head(),\"\\n\"*3)\n", "\n", "data.shape" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "qjA8km6Towa4", "outputId": "eedb2338-bcf1-4d88-ff20-a2b0e15d24d4" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "(284807, 31)" ] }, "metadata": {}, "execution_count": 94 } ], "source": [ "data.shape" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 446 }, "id": "3LdxVG-Noyfb", "outputId": "40fee0e0-74d3-40a4-e9da-6f9020b06411" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "0 284315\n", "1 492\n", "Name: Class, dtype: int64" ] }, "metadata": {}, "execution_count": 95 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "iVBORw0KGgoAAAANSUhEUgAAAhEAAAF5CAYAAAAh0Xi4AAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAAWWElEQVR4nO3dfbCmdX3f8c8X1rgKC4K7pbapS7AoyeLghLU0k7bWauPD1Oq4/yj4QJ2KxpLplETLtAtSH9pOaDttOsYpFopY4ygz4EQ7oYkTJKaTtD10xGYVmdC48QHMYrYLuyBC/PaPc53k5hQOe357nnbP6zVzz7nP9bt+9/ndf6y8va7rvq/q7gAALNdJ670AAOD4JCIAgCEiAgAYIiIAgCEiAgAYIiIAgCFb1nsBx5vt27f32Wefvd7LAIA1c+eddz7Q3TsWbxcRy3T22Wdnbm5uvZcBAGumqvY/2XanMwCAISICABgiIgCAISICABgiIgCAISICABgiIgCAISICABgiIgCAISICABgiIgCAISICABgiIgCAIe7iuYFc+N6b1nsJcMzuvPZt670EYI04EgEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADBERAMAQEQEADFmTiKiqZ1bV9VW1v6oeqqovV9VrprGzq6qr6vDM46pFc2+oqger6v6qumLRa7+iqu6uqoer6vaq2rkScwGApa3VkYgtSb6Z5GVJTk+yN8lnqursmX2e092nTo8Pzmy/Jsm5SXYmeXmS91XVq5OkqrYnuSXJVUnOTDKX5NMrNBcAWMKaRER3H+nua7r7G939w+7+fJI/SHLhUUx/e5IPdvfB7v5ako8luXQae2OSfd19c3d/P/PRcEFVnbcCcwGAJazLNRFVdVaSFybZN7N5f1V9q6r+03SUIFV1RpLnJblrZr+7kuyanu+aHevuI0nuTbLrWOYe8xsEgE1gzSOiqp6R5JNJPt7ddyd5IMlLM3/K4cIk26bxJDl1+nlo5iUOTfssjM+OzY4fy9zFa76squaqau7AgQNP9xYBYFNY04ioqpOSfCLJD5JcniTdfbi757r78e7+7rT9Z6pqW5LD09TTZl7mtCQPTc8PLxqbHT+WuU/Q3dd19+7u3r1jx46jeq8AcKJbs4ioqkpyfZKzkuzp7seeYteefp7U3QeT3JfkgpnxC/Jnp0H2zY5V1SlJXpD5ax2G5y77zQHAJrSWRyI+muTHk7yuux9Z2FhVF1XVi6rqpKp6bpJfSvLF7l441XBTkr1VdcZ00eM7k9w4jd2a5Pyq2lNVW5NcneQr02mSY50LACxhrb4nYmeSdyV5SZL7Z74P4pIk5yS5LfOnEX4vyaNJ3jwz/f2Zv+Bxf5I7klzb3bclSXcfSLInyYeTHExyUZI3rdBcAGAJW9bij3T3/iS1xC6fWmLuo0neMT2ebPwLSZ70Y5nHMhcAWJqvvQYAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhogIAGCIiAAAhqxJRFTVM6vq+qraX1UPVdWXq+o1M+OvqKq7q+rhqrq9qnYumntDVT1YVfdX1RWLXntV5gIAS1urIxFbknwzycuSn
J5kb5LPVNXZVbU9yS1JrkpyZpK5JJ+emXtNknOT7Ezy8iTvq6pXJ8kqzwUAlrBlLf5Idx/J/H/QF3y+qv4gyYVJnptkX3ffnCRVdU2SB6rqvO6+O8nbk1za3QeTHKyqjyW5NMltSd64inMBgCWsyzURVXVWkhcm2ZdkV5K7Fsam4Lg3ya6qOiPJ82bHp+e7puerMvdJ1ntZVc1V1dyBAwdG3jIAnHDWPCKq6hlJPpnk49P/4z81yaFFux1Ksm0ay6LxhbGs4twn6O7runt3d+/esWPHU785ANhE1jQiquqkJJ9I8oMkl0+bDyc5bdGupyV5aBrLovGFsdWcCwA8jTWLiKqqJNcnOSvJnu5+bBral+SCmf1OSfKCzF+vcDDJfbPj0/N9qzn3mN4oAGwSa3kk4qNJfjzJ67r7kZnttyY5v6r2VNXWJFcn+crMxY03JdlbVWdU1XlJ3pnkxjWYCwAsYa2+J2JnkncleUmS+6vq8PS4pLsPJNmT5MNJDia5KMmbZqa/P/MXPO5PckeSa7v7tiRZ5bkAwBLW6iOe+5PUEuNfSHLeU4w9muQd02PN5gIAS/O11wDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAwREQDAEBEBAAw56oioql94iu1XrNxyAIDjxXKORFz9FNv3rsRCAIDjy5an26Gq/tb09OSqenmSmhk+J8lDq7EwAGBje9qISHL99HNrkhtmtneS+5P83EovCgDY+J42Irr7x5Kkqm7q7ret/pIAgOPB0RyJSJLMBkRVnbRo7IcruSgAYONbzqczfrKqfqeqjiR5bHo8Pv0EADaZoz4SkeTjST6X5B1JHl6d5QAAx4vlRMTOJP+0u3u1FgMAHD+W8z0Rtyb5mdVaCABwfFlORGxNcmtV/XpV3TT7OJrJVXV5Vc1V1aNVdePM9rOrqqvq8MzjqpnxZ1bVDVX1YFXdv/gbMqvqFVV1d1U9XFW3V9XOlZgLACxtOaczvjo9Rn0nyYeSvCrJs55k/Dnd/fiTbL8mybmZP53y55PcXlVf7e7bqmp7kluS/P3MX6/xwSSfTvJXV2AuALCE5XzE858dyx/q7luSpKp2J/nRZUx9e5JLu/tgkoNV9bEklya5Lckbk+zr7pun174myQNVdV53332McwGAJRx1RMx8/fX/p7t/cwXWsr+qOslvJHlvdz9QVWckeV6Su2b2uyvJG6bnu2bHuvtIVd2bZFdVfXd0bhIRAQBPYzmnM65f9PuOJD+S5FuZv4fGqAeSvDTJl5M8N8lHknwy86c9Tp32OTSz/6Ek26bnpyY5sOj1FsaPZe4TVNVlSS5Lkuc///lH8ZYA4MS3nNMZPzb7e1WdnPk7eB7TDbi6+3CSuenX71bV5Unuq6ptSQ5P209L8v2Z5wt/8/D0+6yF8WOZu3iN1yW5Lkl2797tI64AkOV9OuMJuvtPknw4yftWbjnzLz39PGm6luG+JBfMjF+QZN/0fN/sWFWdkuQFmb/WYXjuir0TADiBDUfE5G8nOar7ZlTVlqramuTkzN9WfOu07aKqelFVnVRVz03yS0m+2N0LpyFuSrK3qs6oqvOSvDPJjdPYrUnOr6o902tfneQrMxdGHstcAGAJy7l3xjer6g9nHg8kuTnJlUf5EnuTPDLt/5bp+d7MX09xW+ZPI/xekkeTvHlm3vuT3Jtkf5I7klzb3bclSXcfSLIn80dEDia5KMmbVmguALCEOtpvsa6qly3adCTJPd394IqvagPbvXt3z83NPf2OAy5871F9bxdsaHde+7an3wk4rlTVnd29e/H25VxYecf0QiclOSvJd90CHAA2r+Wcztg2fcX1I0m+n
eSRqvp4VZ2+aqsDADas5VxY+e+TnJLkxZn/2uoXJ3l25i+EBAA2meV82dSrk5zT3Q9Pv99TVX8v8xcuAgCbzHKORHw/899SOWt75j9NAQBsMss5EvEfk/xGVf2bzH9kcmeSf5TkY6uxMABgY1tORHw48xdUXpLkL2T+1t6/2N2L76kBAGwCyzmd8e+SfL27X9ndP9Hdr0zytar6t6u0NgBgA1tORLw5f3ajrAV3Jrl45ZYDABwvlhMRnfn7Xsw6eZmvAQCcIJYTAF9K8sHpGysXvrnymmk7ALDJLOfCyn+Y5PNJ7quq/Umen/lbbb9uNRYGAGxsy7l3xreq6ieT/JUkfynJN5P8D/fPAIDNaTlHIjIFw+9ODwBgE3NRJAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwREQAAENEBAAwZM0ioqour6q5qnq0qm5cNPaKqrq7qh6uqturaufM2DOr6oaqerCq7q+qK9ZiLgCwtLU8EvGdJB9KcsPsxqranuSWJFclOTPJXJJPz+xyTZJzk+xM8vIk76uqV6/BXABgCWsWEd19S3d/Nsn3Fg29Mcm+7r65u7+f+f/wX1BV503jb0/ywe4+2N1fS/KxJJeuwVwAYAkb4ZqIXUnuWvilu48kuTfJrqo6I8nzZsen57tWc+6KvCsAOMFthIg4NcmhRdsOJdk2jWXR+MLYas59gqq6bLqeY+7AgQNLvhkA2Cw2QkQcTnLaom2nJXloGsui8YWx1Zz7BN19XXfv7u7dO3bsWPLNAMBmsREiYl+SCxZ+qapTkrwg89crHExy3+z49Hzfas5dkXcFACe4tfyI55aq2prk5CQnV9XWqtqS5NYk51fVnmn86iRf6e67p6k3JdlbVWdMFz2+M8mN09hqzgUAlrCWRyL2JnkkyZVJ3jI939vdB5LsSfLhJAeTXJTkTTPz3p/5Cx73J7kjybXdfVuSrPJcAGAJ1d3rvYbjyu7du3tubm5VXvvC9960Kq8La+nOa9+23ksAVlhV3dnduxdv3wjXRAAAxyERAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwBARAQAMEREAwJANExFV9cWq+n5VHZ4eX58Zu7iq9lfVkar6bFWdOTN2ZlXdOo3tr6qLF73u8FwA4KltmIiYXN7dp06PFyVJVe1K8h+SvDXJWUkeTvLLM3M+kuQH09glST46zTmmuQDA0ras9wKOwiVJPtfdv5UkVXVVkq9V1bYkP0yyJ8n53X04yW9X1a9mPhquPMa5AMASNtqRiH9RVQ9U1X+rqr85bduV5K6FHbr73swfPXjh9Hi8u++ZeY27pjnHOvdPVdVlVTVXVXMHDhw4xrcIACeGjRQR/zjJOUn+YpLrknyuql6Q5NQkhxbteyjJtmnswacYyzHO/VPdfV137+7u3Tt27FjOewKAE9aGOZ3R3f995tePV9Wbk7w2yeEkpy3a/bQkD2X+lMRTjeUY5wIAS9hIRyIW6ySVZF+SCxY2VtU5SZ6Z5J7psaWqzp2Zd8E0J8c4FwBYwoaIiKp6TlW9qqq2VtWWqrokyd9IcluSTyZ5XVX99ao6JckHktzS3Q9195EktyT5QFWdUlU/neT1ST4xvfSxzAUAlrAhIiLJM5J8KMmBJA8k+bkkb
+jue7p7X5J3Zz4I/ijz1yy8Z2bue5I8axr7VJKfnebkWOYCAEvbENdEdPeBJC9dYvxXkvzKU4z9cZI3rMZcAOCpbZQjEQDAcUZEAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDRAQAMEREAABDNn1EVNWZVXVrVR2pqv1VdfF6rwkAjgdb1nsBG8BHkvwgyVlJXpLkv1TVXd29b32XBQAb26Y+ElFVpyTZk+Sq7j7c3b+d5FeTvHV9VwYAG99mPxLxwiSPd/c9M9vuSvKydVoPsA7+8AMvXu8lwDF7/tX/e83/5maPiFOTPLho26Ek22Y3VNVlSS6bfj1cVV9fg7WxOrYneWC9F3Eiq3/19vVeAhuTf3ur7f21mq++88k2bvaIOJzktEXbTkvy0OyG7r4uyXVrtShWT1XNdffu9V4HbDb+7Z2YNvU1EUnuSbKlqs6d2XZBEhdVAsDT2NQR0d1HktyS5ANVdUpV/XSS1yf5xPquDAA2vk0dEZP3JHlWkj9K8qkkP+vjnSc0p6Vgffi3dwKq7l7vNQAAxyFHIgCAISICABgiItgU3CMF1kdVXV5Vc1X1aFXduN7rYWVt9u+JYPNwjxRYH99J8qEkr8r8ReycQFxYyQlvukfKwSTnL3zFeVV9Ism3u/vKdV0cbBJV9aEkP9rdl673Wlg5TmewGTzVPVJ2rdN6AE4IIoLN4KjukQLA8ogINoOjukcKAMsjItgM3CMFYBWICE547pEC66eqtlTV1iQnJzm5qrZWlU8GniBEBJuFe6TA+tib5JEkVyZ5y/R877quiBXjI54AwBBHIgCAISICABgiIgCAISICABgiIgCAISICABgiIoANo6quqar/vN7rAI6OiADWXFVdXFVzVXW4qu6rql+rqr+23usClsdXjwJrqqquyPy3F747yX9N8oMkr878V5EfWcelAcvkSASwZqrq9CQfSPIPuvuW7j7S3Y919+e6+71Psv/NVXV/VR2qqt+qql0zY6+tqq9W1UNV9e2q+oVp+/aq+nxV/d+q+uOq+lJV+d86WAX+YQFr6aeSbE1y61Hu/2tJzk3y55L8rySfnBm7Psm7untbkvOT/Oa0/eeTfCvJjiRnJfknSXy/P6wCpzOAtfTcJA909+NHs3N337DwvKquSXKwqk7v7kNJHkvyE1V1V3cfTHJw2vWxJM9LsrO7fz/Jl1byDQB/xpEIYC19L8n2o7kVdFWdXFX/sqruraoHk3xjGto+/dyT5LVJ9lfVHVX1U9P2a5P8fpJfr6r/U1VXruxbABaICGAt/U6SR5O84Sj2vTjzF1u+MsnpSc6etleSdPf/7O7XZ/5Ux2eTfGba/lB3/3x3n5Pk7ya5oqpesZJvApgnIoA1M52GuDrJR6rqDVX17Kp6RlW9pqp+cdHu2zIfHN9L8uwk/3xhoKp+pKoumU5tPJbkwSQ/nMb+TlX95aqqJIeS/MnCGLCyRASwprr7Xye5IsneJAeSfDPJ5Zk/mjDrpiT7k3w7yVeT/O6i8bcm+cZ0quPdSS6Ztp+b5AtJDmf+yMcvd/ftK/9OgOp20TIAsHyORAAAQ0QEADBERAAAQ0QEADBERAAAQ0QEADBERAAAQ0QEADBERAAAQ/4f3Z+al1My3xMAAAAASUVORK5CYII=\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "sns.countplot(x=data['Class'])\n", "data[\"Class\"].value_counts()" 
] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 394 }, "id": "HE27u1Looyky", "outputId": "64d05722-6540-4ade-d1f1-fdfb4abbf9e1" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " Time V1 V2 V3 V4 \\\n", "count 284807.000000 2.848070e+05 2.848070e+05 2.848070e+05 2.848070e+05 \n", "mean 94813.859575 1.168375e-15 3.416908e-16 -1.379537e-15 2.074095e-15 \n", "std 47488.145955 1.958696e+00 1.651309e+00 1.516255e+00 1.415869e+00 \n", "min 0.000000 -5.640751e+01 -7.271573e+01 -4.832559e+01 -5.683171e+00 \n", "25% 54201.500000 -9.203734e-01 -5.985499e-01 -8.903648e-01 -8.486401e-01 \n", "50% 84692.000000 1.810880e-02 6.548556e-02 1.798463e-01 -1.984653e-02 \n", "75% 139320.500000 1.315642e+00 8.037239e-01 1.027196e+00 7.433413e-01 \n", "max 172792.000000 2.454930e+00 2.205773e+01 9.382558e+00 1.687534e+01 \n", "\n", " V5 V6 V7 V8 V9 \\\n", "count 2.848070e+05 2.848070e+05 2.848070e+05 2.848070e+05 2.848070e+05 \n", "mean 9.604066e-16 1.487313e-15 -5.556467e-16 1.213481e-16 -2.406331e-15 \n", "std 1.380247e+00 1.332271e+00 1.237094e+00 1.194353e+00 1.098632e+00 \n", "min -1.137433e+02 -2.616051e+01 -4.355724e+01 -7.321672e+01 -1.343407e+01 \n", "25% -6.915971e-01 -7.682956e-01 -5.540759e-01 -2.086297e-01 -6.430976e-01 \n", "50% -5.433583e-02 -2.741871e-01 4.010308e-02 2.235804e-02 -5.142873e-02 \n", "75% 6.119264e-01 3.985649e-01 5.704361e-01 3.273459e-01 5.971390e-01 \n", "max 3.480167e+01 7.330163e+01 1.205895e+02 2.000721e+01 1.559499e+01 \n", "\n", " ... V21 V22 V23 V24 \\\n", "count ... 2.848070e+05 2.848070e+05 2.848070e+05 2.848070e+05 \n", "mean ... 1.654067e-16 -3.568593e-16 2.578648e-16 4.473266e-15 \n", "std ... 7.345240e-01 7.257016e-01 6.244603e-01 6.056471e-01 \n", "min ... -3.483038e+01 -1.093314e+01 -4.480774e+01 -2.836627e+00 \n", "25% ... -2.283949e-01 -5.423504e-01 -1.618463e-01 -3.545861e-01 \n", "50% ... 
-2.945017e-02 6.781943e-03 -1.119293e-02 4.097606e-02 \n", "75% ... 1.863772e-01 5.285536e-01 1.476421e-01 4.395266e-01 \n", "max ... 2.720284e+01 1.050309e+01 2.252841e+01 4.584549e+00 \n", "\n", " V25 V26 V27 V28 Amount \\\n", "count 2.848070e+05 2.848070e+05 2.848070e+05 2.848070e+05 284807.000000 \n", "mean 5.340915e-16 1.683437e-15 -3.660091e-16 -1.227390e-16 88.349619 \n", "std 5.212781e-01 4.822270e-01 4.036325e-01 3.300833e-01 250.120109 \n", "min -1.029540e+01 -2.604551e+00 -2.256568e+01 -1.543008e+01 0.000000 \n", "25% -3.171451e-01 -3.269839e-01 -7.083953e-02 -5.295979e-02 5.600000 \n", "50% 1.659350e-02 -5.213911e-02 1.342146e-03 1.124383e-02 22.000000 \n", "75% 3.507156e-01 2.409522e-01 9.104512e-02 7.827995e-02 77.165000 \n", "max 7.519589e+00 3.517346e+00 3.161220e+01 3.384781e+01 25691.160000 \n", "\n", " Class \n", "count 284807.000000 \n", "mean 0.001727 \n", "std 0.041527 \n", "min 0.000000 \n", "25% 0.000000 \n", "50% 0.000000 \n", "75% 0.000000 \n", "max 1.000000 \n", "\n", "[8 rows x 31 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimeV1V2V3V4V5V6V7V8V9...V21V22V23V24V25V26V27V28AmountClass
count284807.0000002.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+05...2.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+052.848070e+05284807.000000284807.000000
mean94813.8595751.168375e-153.416908e-16-1.379537e-152.074095e-159.604066e-161.487313e-15-5.556467e-161.213481e-16-2.406331e-15...1.654067e-16-3.568593e-162.578648e-164.473266e-155.340915e-161.683437e-15-3.660091e-16-1.227390e-1688.3496190.001727
std47488.1459551.958696e+001.651309e+001.516255e+001.415869e+001.380247e+001.332271e+001.237094e+001.194353e+001.098632e+00...7.345240e-017.257016e-016.244603e-016.056471e-015.212781e-014.822270e-014.036325e-013.300833e-01250.1201090.041527
min0.000000-5.640751e+01-7.271573e+01-4.832559e+01-5.683171e+00-1.137433e+02-2.616051e+01-4.355724e+01-7.321672e+01-1.343407e+01...-3.483038e+01-1.093314e+01-4.480774e+01-2.836627e+00-1.029540e+01-2.604551e+00-2.256568e+01-1.543008e+010.0000000.000000
25%54201.500000-9.203734e-01-5.985499e-01-8.903648e-01-8.486401e-01-6.915971e-01-7.682956e-01-5.540759e-01-2.086297e-01-6.430976e-01...-2.283949e-01-5.423504e-01-1.618463e-01-3.545861e-01-3.171451e-01-3.269839e-01-7.083953e-02-5.295979e-025.6000000.000000
50%84692.0000001.810880e-026.548556e-021.798463e-01-1.984653e-02-5.433583e-02-2.741871e-014.010308e-022.235804e-02-5.142873e-02...-2.945017e-026.781943e-03-1.119293e-024.097606e-021.659350e-02-5.213911e-021.342146e-031.124383e-0222.0000000.000000
75%139320.5000001.315642e+008.037239e-011.027196e+007.433413e-016.119264e-013.985649e-015.704361e-013.273459e-015.971390e-01...1.863772e-015.285536e-011.476421e-014.395266e-013.507156e-012.409522e-019.104512e-027.827995e-0277.1650000.000000
max172792.0000002.454930e+002.205773e+019.382558e+001.687534e+013.480167e+017.330163e+011.205895e+022.000721e+011.559499e+01...2.720284e+011.050309e+012.252841e+014.584549e+007.519589e+003.517346e+003.161220e+013.384781e+0125691.1600001.000000
\n", "

8 rows × 31 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 96 } ], "source": [ "data.describe()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "0CQCPvxDo5dA", "outputId": "47874a73-0ce8-4745-eb4f-e0e26e1dcf3a" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "Time 0\n", "V1 0\n", "V2 0\n", "V3 0\n", "V4 0\n", "V5 0\n", "V6 0\n", "V7 0\n", "V8 0\n", "V9 0\n", "V10 0\n", "V11 0\n", "V12 0\n", "V13 0\n", "V14 0\n", "V15 0\n", "V16 0\n", "V17 0\n", "V18 0\n", "V19 0\n", "V20 0\n", "V21 0\n", "V22 0\n", "V23 0\n", "V24 0\n", "V25 0\n", "V26 0\n", "V27 0\n", "V28 0\n", "Amount 0\n", "Class 0\n", "dtype: int64" ] }, "metadata": {}, "execution_count": 97 } ], "source": [ "data.isnull().sum()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "LRAH6L95o-je" }, "outputs": [], "source": [ "fraud = data[data[\"Class\"] == 1]\n", "normal = data[data[\"Class\"] == 0]" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 394 }, "id": "hUHu1D0TpEbx", "outputId": "55e3405f-10fd-4c1d-cce9-1e98a11449c5" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " Time V1 V2 V3 V4 \\\n", "count 492.000000 492.000000 492.000000 492.000000 492.000000 \n", "mean 80746.806911 -4.771948 3.623778 -7.033281 4.542029 \n", "std 47835.365138 6.783687 4.291216 7.110937 2.873318 \n", "min 406.000000 -30.552380 -8.402154 -31.103685 -1.313275 \n", "25% 41241.500000 -6.036063 1.188226 -8.643489 2.373050 \n", "50% 75568.500000 -2.342497 2.717869 -5.075257 4.177147 \n", "75% 128483.000000 -0.419200 4.971257 -2.276185 6.348729 \n", "max 170348.000000 2.132386 22.057729 2.250210 12.114672 \n", "\n", " V5 V6 V7 V8 V9 ... \\\n", "count 492.000000 492.000000 492.000000 492.000000 492.000000 ... \n", "mean -3.151225 -1.397737 -5.568731 0.570636 -2.581123 ... 
\n", "std 5.372468 1.858124 7.206773 6.797831 2.500896 ... \n", "min -22.105532 -6.406267 -43.557242 -41.044261 -13.434066 ... \n", "25% -4.792835 -2.501511 -7.965295 -0.195336 -3.872383 ... \n", "50% -1.522962 -1.424616 -3.034402 0.621508 -2.208768 ... \n", "75% 0.214562 -0.413216 -0.945954 1.764879 -0.787850 ... \n", "max 11.095089 6.474115 5.802537 20.007208 3.353525 ... \n", "\n", " V21 V22 V23 V24 V25 V26 \\\n", "count 492.000000 492.000000 492.000000 492.000000 492.000000 492.000000 \n", "mean 0.713588 0.014049 -0.040308 -0.105130 0.041449 0.051648 \n", "std 3.869304 1.494602 1.579642 0.515577 0.797205 0.471679 \n", "min -22.797604 -8.887017 -19.254328 -2.028024 -4.781606 -1.152671 \n", "25% 0.041787 -0.533764 -0.342175 -0.436809 -0.314348 -0.259416 \n", "50% 0.592146 0.048434 -0.073135 -0.060795 0.088371 0.004321 \n", "75% 1.244611 0.617474 0.308378 0.285328 0.456515 0.396733 \n", "max 27.202839 8.361985 5.466230 1.091435 2.208209 2.745261 \n", "\n", " V27 V28 Amount Class \n", "count 492.000000 492.000000 492.000000 492.0 \n", "mean 0.170575 0.075667 122.211321 1.0 \n", "std 1.376766 0.547291 256.683288 0.0 \n", "min -7.263482 -1.869290 0.000000 1.0 \n", "25% -0.020025 -0.108868 1.000000 1.0 \n", "50% 0.394926 0.146344 9.250000 1.0 \n", "75% 0.826029 0.381152 105.890000 1.0 \n", "max 3.052358 1.779364 2125.870000 1.0 \n", "\n", "[8 rows x 31 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimeV1V2V3V4V5V6V7V8V9...V21V22V23V24V25V26V27V28AmountClass
count492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.000000...492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.000000492.0
mean80746.806911-4.7719483.623778-7.0332814.542029-3.151225-1.397737-5.5687310.570636-2.581123...0.7135880.014049-0.040308-0.1051300.0414490.0516480.1705750.075667122.2113211.0
std47835.3651386.7836874.2912167.1109372.8733185.3724681.8581247.2067736.7978312.500896...3.8693041.4946021.5796420.5155770.7972050.4716791.3767660.547291256.6832880.0
min406.000000-30.552380-8.402154-31.103685-1.313275-22.105532-6.406267-43.557242-41.044261-13.434066...-22.797604-8.887017-19.254328-2.028024-4.781606-1.152671-7.263482-1.8692900.0000001.0
25%41241.500000-6.0360631.188226-8.6434892.373050-4.792835-2.501511-7.965295-0.195336-3.872383...0.041787-0.533764-0.342175-0.436809-0.314348-0.259416-0.020025-0.1088681.0000001.0
50%75568.500000-2.3424972.717869-5.0752574.177147-1.522962-1.424616-3.0344020.621508-2.208768...0.5921460.048434-0.073135-0.0607950.0883710.0043210.3949260.1463449.2500001.0
75%128483.000000-0.4192004.971257-2.2761856.3487290.214562-0.413216-0.9459541.764879-0.787850...1.2446110.6174740.3083780.2853280.4565150.3967330.8260290.381152105.8900001.0
max170348.0000002.13238622.0577292.25021012.11467211.0950896.4741155.80253720.0072083.353525...27.2028398.3619855.4662301.0914352.2082092.7452613.0523581.7793642125.8700001.0
\n", "

8 rows × 31 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 99 } ], "source": [ "fraud.describe()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 394 }, "id": "TrZFcF2spHN_", "outputId": "4f512d8f-763e-4384-d0fd-e3504e4db0a0" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " Time V1 V2 V3 \\\n", "count 284315.000000 284315.000000 284315.000000 284315.000000 \n", "mean 94838.202258 0.008258 -0.006271 0.012171 \n", "std 47484.015786 1.929814 1.636146 1.459429 \n", "min 0.000000 -56.407510 -72.715728 -48.325589 \n", "25% 54230.000000 -0.917544 -0.599473 -0.884541 \n", "50% 84711.000000 0.020023 0.064070 0.182158 \n", "75% 139333.000000 1.316218 0.800446 1.028372 \n", "max 172792.000000 2.454930 18.902453 9.382558 \n", "\n", " V4 V5 V6 V7 \\\n", "count 284315.000000 284315.000000 284315.000000 284315.000000 \n", "mean -0.007860 0.005453 0.002419 0.009637 \n", "std 1.399333 1.356952 1.329913 1.178812 \n", "min -5.683171 -113.743307 -26.160506 -31.764946 \n", "25% -0.850077 -0.689398 -0.766847 -0.551442 \n", "50% -0.022405 -0.053457 -0.273123 0.041138 \n", "75% 0.737624 0.612181 0.399619 0.571019 \n", "max 16.875344 34.801666 73.301626 120.589494 \n", "\n", " V8 V9 ... V21 V22 \\\n", "count 284315.000000 284315.000000 ... 284315.000000 284315.000000 \n", "mean -0.000987 0.004467 ... -0.001235 -0.000024 \n", "std 1.161283 1.089372 ... 0.716743 0.723668 \n", "min -73.216718 -6.290730 ... -34.830382 -10.933144 \n", "25% -0.208633 -0.640412 ... -0.228509 -0.542403 \n", "50% 0.022041 -0.049964 ... -0.029821 0.006736 \n", "75% 0.326200 0.598230 ... 0.185626 0.528407 \n", "max 18.709255 15.594995 ... 
22.614889 10.503090 \n", "\n", " V23 V24 V25 V26 \\\n", "count 284315.000000 284315.000000 284315.000000 284315.000000 \n", "mean 0.000070 0.000182 -0.000072 -0.000089 \n", "std 0.621541 0.605776 0.520673 0.482241 \n", "min -44.807735 -2.836627 -10.295397 -2.604551 \n", "25% -0.161702 -0.354425 -0.317145 -0.327074 \n", "50% -0.011147 0.041082 0.016417 -0.052227 \n", "75% 0.147522 0.439869 0.350594 0.240671 \n", "max 22.528412 4.584549 7.519589 3.517346 \n", "\n", " V27 V28 Amount Class \n", "count 284315.000000 284315.000000 284315.000000 284315.0 \n", "mean -0.000295 -0.000131 88.291022 0.0 \n", "std 0.399847 0.329570 250.105092 0.0 \n", "min -22.565679 -15.430084 0.000000 0.0 \n", "25% -0.070852 -0.052950 5.650000 0.0 \n", "50% 0.001230 0.011199 22.000000 0.0 \n", "75% 0.090573 0.077962 77.050000 0.0 \n", "max 31.612198 33.847808 25691.160000 0.0 \n", "\n", "[8 rows x 31 columns]" ], "text/html": [ "\n", "
\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
TimeV1V2V3V4V5V6V7V8V9...V21V22V23V24V25V26V27V28AmountClass
count284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000...284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.000000284315.0
mean94838.2022580.008258-0.0062710.012171-0.0078600.0054530.0024190.009637-0.0009870.004467...-0.001235-0.0000240.0000700.000182-0.000072-0.000089-0.000295-0.00013188.2910220.0
std47484.0157861.9298141.6361461.4594291.3993331.3569521.3299131.1788121.1612831.089372...0.7167430.7236680.6215410.6057760.5206730.4822410.3998470.329570250.1050920.0
min0.000000-56.407510-72.715728-48.325589-5.683171-113.743307-26.160506-31.764946-73.216718-6.290730...-34.830382-10.933144-44.807735-2.836627-10.295397-2.604551-22.565679-15.4300840.0000000.0
25%54230.000000-0.917544-0.599473-0.884541-0.850077-0.689398-0.766847-0.551442-0.208633-0.640412...-0.228509-0.542403-0.161702-0.354425-0.317145-0.327074-0.070852-0.0529505.6500000.0
50%84711.0000000.0200230.0640700.182158-0.022405-0.053457-0.2731230.0411380.022041-0.049964...-0.0298210.006736-0.0111470.0410820.016417-0.0522270.0012300.01119922.0000000.0
75%139333.0000001.3162180.8004461.0283720.7376240.6121810.3996190.5710190.3262000.598230...0.1856260.5284070.1475220.4398690.3505940.2406710.0905730.07796277.0500000.0
max172792.0000002.45493018.9024539.38255816.87534434.80166673.301626120.58949418.70925515.594995...22.61488910.50309022.5284124.5845497.5195893.51734631.61219833.84780825691.1600000.0
\n", "

8 rows × 31 columns

\n", "
\n", " \n", " \n", " \n", "\n", " \n", "
\n", "
\n", " " ] }, "metadata": {}, "execution_count": 100 } ], "source": [ "normal.describe()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 428 }, "id": "49naUOY2pnBH", "outputId": "09fe4842-9990-4195-c52f-a641b6903fd3" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 101 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "# Adjusting figure size and font size\n", "plt.rcParams[\"figure.figsize\"] = (8, 6)\n", "font = {'size': 12}\n", "plt.rc('font', **font)\n", "\n", "# Adding titles to the plot and axes\n", "plt.title(\"Distribution of Amount over Both Classes\")\n", "plt.xlabel(\"Amount\")\n", "plt.ylabel(\"Class\")\n", "\n", "# Plotting the Amount column vs. Class column\n", "plt.scatter(data[\"Amount\"],data[\"Class\"])\n", "\n", "\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "fXMOorpRp8mo" }, "outputs": [], "source": [ "# Features: every column except the label (Class) and the Time column\n", "X = data.drop([\"Class\",\"Time\"],axis=1)\n", "y = data[\"Class\"]\n", "\n", "# Stratify on y so the train and test sets keep the same fraud ratio:\n", "# fraud is only ~0.17% of the rows, so a plain random split can skew it.\n", "X_train_Before, X_test, y_train_Before, y_test = train_test_split(\n", "    X, y, test_size=0.3, random_state=42, stratify=y)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "Tw1kdGZ9bJ7B" }, "outputs": [], "source": [ "# Data normalization\n", "from sklearn.preprocessing import StandardScaler\n", "\n", "# StandardScaler standardizes every column independently, so a single scaler\n", "# fitted on the training features replaces the per-column loop. It is fitted on\n", "# the training split only and then reused, unchanged, on the test split.\n", "# New DataFrames are built instead of assigning column by column into the\n", "# frames returned by train_test_split.\n", "scaler = StandardScaler()\n", "feature_columns = X_train_Before.columns\n", "X_train_Before = pd.DataFrame(\n", "    scaler.fit_transform(X_train_Before),\n", "    columns=feature_columns, index=X_train_Before.index)\n", "X_test = pd.DataFrame(\n", "    scaler.transform(X_test),\n", "    columns=feature_columns, index=X_test.index)\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "WUI5P98fp_f6" }, "outputs": [], "source": [ "# Balancing the training split with Borderline-SMOTE (the test split is left as is)\n", "borderlineSMOTE = BorderlineSMOTE(k_neighbors = 10, random_state = 42)\n", "X_train, y_train = borderlineSMOTE.fit_resample(X_train_Before,y_train_Before)\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 411 }, "id": "g1jhOEbFqC41", "outputId": "8253552a-18d8-43ef-f1a5-d4b0521d45fe" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 105 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "# Class counts of the training labels before resampling\n", "sns.countplot(x=y_train_Before)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 411 }, "id": "S2paolRcqHpr", "outputId": "ae21a0bb-2080-4acf-b518-013d8e0fa62c" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 106 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "# Class counts of the training labels after Borderline-SMOTE resampling\n", "sns.countplot(x=y_train)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "LaePMvTLqJ8F" }, "outputs": [], "source": [ "# Random Forest classifier: fit on the resampled training set, predict the test split\n", "rf = RandomForestClassifier(n_estimators=35, random_state=42).fit(X_train, y_train)\n", "y_pred = rf.predict(X_test)\n", "\n", "# Precision, recall and F1 of the test-split predictions\n", "precision, recall, f1 = (\n", "    score_fn(y_test, y_pred)\n", "    for score_fn in (precision_score, recall_score, f1_score)\n", ")\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 394 }, "id": "7VvOwsuWxVxv", "outputId": "292e4d78-fac9-4ce0-80a2-0d40be3bf54b" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 108 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "# Confusion matrix of the Random Forest predictions on the test split\n", "cm = confusion_matrix(y_test, y_pred)\n", "sns.heatmap(\n", "    cm,\n", "    annot=True,\n", "    fmt='g',\n", "    yticklabels=[\"Real Negative\", \"Real Positive\"],\n", "    xticklabels=[\"Predicted Negative\", \"Predicted Positive\"],\n", ")\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "TwkJQImjt9tL", "outputId": "417f59a8-099a-4753-8eb0-ed8703e32051" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Precision: 87.88 %\n", "Recall: 85.29 %\n", "F1: 86.57 %\n" ] } ], "source": [ "# Report the Random Forest scores as percentages rounded to two decimals\n", "for label, score in ((\"Precision: \", precision), (\"Recall: \", recall), (\"F1: \", f1)):\n", "    print(label, round(score*100, 2), \"%\")\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "sgkE-auW-CEL" }, "outputs": [], "source": [ "# Logistic Regression classifier: fit on the resampled training set, predict the test split\n", "logReg = LogisticRegression().fit(X_train, y_train)\n", "log_y_pred = logReg.predict(X_test)\n", "\n", "# Precision, recall and F1 of the test-split predictions\n", "log_precision, log_recall, log_f1 = (\n", "    score_fn(y_test, log_y_pred)\n", "    for score_fn in (precision_score, recall_score, f1_score)\n", ")" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 516 }, "id": "L06gPPFk-iqA", "outputId": "00abd74a-0843-4069-97f5-bc744f564f36" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Precision: 8.78 %\n", "Recall: 88.97 %\n", "F1: 15.98 %\n", "\n", "\n", "\n", "\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 111 }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": { "needs_background": "light" } } ], "source": [ "# Report the Logistic Regression scores as percentages rounded to two decimals\n", "for label, score in ((\"Precision: \", log_precision), (\"Recall: \", log_recall), (\"F1: \", log_f1)):\n", "    print(label, round(score*100, 2), \"%\")\n", "print(\"\\n\"*3)\n", "\n", "# Confusion matrix of the Logistic Regression predictions on the test split\n", "cm = confusion_matrix(y_test, log_y_pred)\n", "sns.heatmap(\n", "    cm,\n", "    annot=True,\n", "    fmt='g',\n", "    yticklabels=[\"Real Negative\", \"Real Positive\"],\n", "    xticklabels=[\"Predicted Negative\", \"Predicted Positive\"],\n", ")\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "XECYUlEjSCZn" }, "outputs": [], "source": [] } ], "metadata": { "accelerator": "GPU", "colab": { "provenance": [] }, "kernelspec": { "display_name": "Python 3", "name": "python3" }, "language_info": { "name": "python" } }, "nbformat": 4, "nbformat_minor": 0 }