{ "cells": [ { "cell_type": "markdown", "id": "5e4ce795", "metadata": { "papermill": { "duration": 0.033432, "end_time": "2022-05-11T11:03:04.321959", "exception": false, "start_time": "2022-05-11T11:03:04.288527", "status": "completed" }, "tags": [] }, "source": [ "Problem statement\n", "\n", "The May edition of the 2022 Tabular Playground Series is a binary classification problem that includes a number of different feature interactions. This competition is an opportunity to explore various methods for identifying and exploiting these feature interactions." ] }, { "cell_type": "markdown", "id": "af70a983", "metadata": { "papermill": { "duration": 0.032628, "end_time": "2022-05-11T11:03:04.386417", "exception": false, "start_time": "2022-05-11T11:03:04.353789", "status": "completed" }, "tags": [] }, "source": [ "Import libraries" ] }, { "cell_type": "code", "execution_count": 1, "id": "a8932043", "metadata": { "execution": { "iopub.execute_input": "2022-05-11T11:03:04.453540Z", "iopub.status.busy": "2022-05-11T11:03:04.452968Z", "iopub.status.idle": "2022-05-11T11:03:05.559143Z", "shell.execute_reply": "2022-05-11T11:03:05.558125Z" }, "papermill": { "duration": 1.143269, "end_time": "2022-05-11T11:03:05.561715", "exception": false, "start_time": "2022-05-11T11:03:04.418446", "status": "completed" }, "tags": [] }, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns" ] }, { "cell_type": "code", "execution_count": 5, "id": "66d2b4ae", "metadata": { "execution": { "iopub.execute_input": "2022-05-11T11:03:05.627534Z", "iopub.status.busy": "2022-05-11T11:03:05.627253Z", "iopub.status.idle": "2022-05-11T11:03:05.633896Z", "shell.execute_reply": "2022-05-11T11:03:05.633045Z" }, "papermill": { "duration": 0.043253, "end_time": "2022-05-11T11:03:05.637363", "exception": false, "start_time": "2022-05-11T11:03:05.594110", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", 
"output_type": "stream", "text": [ "../coal-price-data/binary_classification/sample_submission.csv\n", "../coal-price-data/binary_classification/train.csv\n", "../coal-price-data/binary_classification/test.csv\n" ] } ], "source": [ "import os\n", "\n", "# Directory holding the competition CSVs; the read cell below reuses `path`.\n", "path = \"../coal-price-data/binary_classification\"\n", "\n", "# Print every file found under `path` so the expected inputs can be checked by eye.\n", "for dirname, _, filenames in os.walk(path):\n", "    for filename in filenames:\n", "        print(os.path.join(dirname, filename))" ] }, { "cell_type": "markdown", "id": "be1e26a5", "metadata": { "papermill": { "duration": 0.035619, "end_time": "2022-05-11T11:03:05.708148", "exception": false, "start_time": "2022-05-11T11:03:05.672529", "status": "completed" }, "tags": [] }, "source": [ "Read files" ] }, { "cell_type": "code", "execution_count": 6, "id": "1c56f757", "metadata": { "execution": { "iopub.execute_input": "2022-05-11T11:03:05.776270Z", "iopub.status.busy": "2022-05-11T11:03:05.775581Z", "iopub.status.idle": "2022-05-11T11:03:21.346102Z", "shell.execute_reply": "2022-05-11T11:03:21.345294Z" }, "papermill": { "duration": 15.60683, "end_time": "2022-05-11T11:03:21.348390", "exception": false, "start_time": "2022-05-11T11:03:05.741560", "status": "completed" }, "tags": [] }, "outputs": [], "source": [ "# Load the three competition tables from `path` (set in the file-listing cell above).\n", "train = pd.read_csv(f\"{path}/train.csv\")\n", "test = pd.read_csv(f\"{path}/test.csv\")\n", "submission = pd.read_csv(f\"{path}/sample_submission.csv\")" ] }, { "cell_type": "code", "execution_count": 7, "id": "7dc3af51", "metadata": { "execution": { "iopub.execute_input": "2022-05-11T11:03:21.416502Z", "iopub.status.busy": "2022-05-11T11:03:21.416126Z", "iopub.status.idle": "2022-05-11T11:03:21.717153Z", "shell.execute_reply": "2022-05-11T11:03:21.716495Z" }, "papermill": { "duration": 0.338273, "end_time": "2022-05-11T11:03:21.719304", "exception": false, "start_time": "2022-05-11T11:03:21.381031", "status": "completed" }, "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", " | id | \n", "f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "... | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_27 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "target | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "-1.373246 | \n", "0.238887 | \n", "-0.243376 | \n", "0.567405 | \n", "-0.647715 | \n", "0.839326 | \n", "0.113133 | \n", "1 | \n", "5 | \n", "... | \n", "-2.540739 | \n", "0.766952 | \n", "-2.730628 | \n", "-0.208177 | \n", "1.363402 | \n", "ABABDADBAB | \n", "67.609153 | \n", "0 | \n", "0 | \n", "0 | \n", "
1 | \n", "1 | \n", "1.697021 | \n", "-1.710322 | \n", "-2.230332 | \n", "-0.545661 | \n", "1.113173 | \n", "-1.552175 | \n", "0.447825 | \n", "1 | \n", "3 | \n", "... | \n", "2.278315 | \n", "-0.633658 | \n", "-1.217077 | \n", "-3.782194 | \n", "-0.058316 | \n", "ACACCADCEB | \n", "377.096415 | \n", "0 | \n", "0 | \n", "1 | \n", "
2 | \n", "2 | \n", "1.681726 | \n", "0.616746 | \n", "-1.027689 | \n", "0.810492 | \n", "-0.609086 | \n", "0.113965 | \n", "-0.708660 | \n", "1 | \n", "0 | \n", "... | \n", "-1.385775 | \n", "-0.520558 | \n", "-0.009121 | \n", "2.788536 | \n", "-3.703488 | \n", "AAAEABCKAD | \n", "-195.599702 | \n", "0 | \n", "2 | \n", "1 | \n", "
3 | \n", "3 | \n", "-0.118172 | \n", "-0.587835 | \n", "-0.804638 | \n", "2.086822 | \n", "0.371005 | \n", "-0.128831 | \n", "-0.282575 | \n", "3 | \n", "2 | \n", "... | \n", "0.572594 | \n", "-1.653213 | \n", "1.686035 | \n", "-2.533098 | \n", "-0.608601 | \n", "BDBBAACBCB | \n", "210.826205 | \n", "0 | \n", "0 | \n", "1 | \n", "
4 | \n", "4 | \n", "1.148481 | \n", "-0.176567 | \n", "-0.664871 | \n", "-1.101343 | \n", "0.467875 | \n", "0.500117 | \n", "0.407515 | \n", "3 | \n", "3 | \n", "... | \n", "-3.912929 | \n", "-1.430366 | \n", "2.127649 | \n", "-3.306784 | \n", "4.371371 | \n", "BDBCBBCHFE | \n", "-217.211798 | \n", "0 | \n", "1 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
899995 | \n", "899995 | \n", "1.380145 | \n", "-0.038884 | \n", "0.597111 | \n", "0.854560 | \n", "0.684301 | \n", "-1.058618 | \n", "1.310699 | \n", "2 | \n", "1 | \n", "... | \n", "-1.594744 | \n", "0.522019 | \n", "0.833047 | \n", "2.714125 | \n", "1.290094 | \n", "BABBCBBBED | \n", "455.033851 | \n", "0 | \n", "2 | \n", "1 | \n", "
899996 | \n", "899996 | \n", "-1.369789 | \n", "0.044841 | \n", "0.015458 | \n", "0.376565 | \n", "-0.380529 | \n", "-0.830815 | \n", "-1.798458 | \n", "4 | \n", "1 | \n", "... | \n", "2.413899 | \n", "-0.674942 | \n", "-0.412111 | \n", "-0.030436 | \n", "-3.144047 | \n", "BBBGBBDQBE | \n", "134.703577 | \n", "0 | \n", "1 | \n", "0 | \n", "
899997 | \n", "899997 | \n", "1.386201 | \n", "-0.961150 | \n", "0.725994 | \n", "-0.132844 | \n", "0.873911 | \n", "-0.245339 | \n", "-1.045786 | \n", "0 | \n", "0 | \n", "... | \n", "-0.151930 | \n", "-4.560773 | \n", "-1.249154 | \n", "1.793535 | \n", "2.253696 | \n", "AEBEDBBHBA | \n", "-99.536313 | \n", "0 | \n", "1 | \n", "0 | \n", "
899998 | \n", "899998 | \n", "-1.590572 | \n", "-0.509938 | \n", "-1.715397 | \n", "-0.249988 | \n", "1.359933 | \n", "1.650808 | \n", "-0.058592 | \n", "0 | \n", "2 | \n", "... | \n", "2.423670 | \n", "2.110008 | \n", "0.561271 | \n", "-2.149610 | \n", "1.019982 | \n", "ADBAAADDAE | \n", "47.823039 | \n", "1 | \n", "2 | \n", "0 | \n", "
899999 | \n", "899999 | \n", "-0.636210 | \n", "-0.425986 | \n", "-1.826699 | \n", "-0.598797 | \n", "1.589577 | \n", "-0.482298 | \n", "-0.214093 | \n", "7 | \n", "1 | \n", "... | \n", "1.340696 | \n", "3.762351 | \n", "1.797137 | \n", "-0.412837 | \n", "2.090440 | \n", "BCAACADSCE | \n", "-44.559296 | \n", "0 | \n", "2 | \n", "1 | \n", "
900000 rows × 33 columns
\n", "\n", " | id | \n", "f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "... | \n", "f_21 | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_27 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "900000 | \n", "0.442517 | \n", "0.174380 | \n", "-0.999816 | \n", "0.762741 | \n", "0.186778 | \n", "-1.074775 | \n", "0.501888 | \n", "6 | \n", "6 | \n", "... | \n", "-1.006400 | \n", "-1.193879 | \n", "-2.435736 | \n", "-2.427430 | \n", "-1.966887 | \n", "5.734205 | \n", "BAAABADLAC | \n", "99.478419 | \n", "0 | \n", "0 | \n", "
1 | \n", "900001 | \n", "-0.605598 | \n", "-0.305715 | \n", "0.627667 | \n", "-0.578898 | \n", "-1.750931 | \n", "1.355550 | \n", "-0.190911 | \n", "1 | \n", "3 | \n", "... | \n", "2.382405 | \n", "0.149442 | \n", "1.883322 | \n", "-2.848714 | \n", "-0.725155 | \n", "3.194219 | \n", "AFABBAEGCB | \n", "-65.993825 | \n", "1 | \n", "0 | \n", "
2 | \n", "900002 | \n", "0.303990 | \n", "2.445110 | \n", "0.246515 | \n", "0.818248 | \n", "0.359731 | \n", "-1.331845 | \n", "1.358622 | \n", "3 | \n", "3 | \n", "... | \n", "-7.026098 | \n", "1.312277 | \n", "-5.157192 | \n", "1.714005 | \n", "0.585032 | \n", "0.066898 | \n", "BBACABBKEE | \n", "-87.405622 | \n", "0 | \n", "1 | \n", "
3 | \n", "900003 | \n", "0.154053 | \n", "0.260126 | \n", "-1.367092 | \n", "-0.093175 | \n", "-1.111034 | \n", "-0.948481 | \n", "1.119220 | \n", "0 | \n", "0 | \n", "... | \n", "-0.594532 | \n", "-3.939475 | \n", "1.754570 | \n", "-2.364007 | \n", "-1.003320 | \n", "3.893099 | \n", "AEBEAACQCC | \n", "-281.293460 | \n", "0 | \n", "0 | \n", "
4 | \n", "900004 | \n", "-1.651904 | \n", "-0.424266 | \n", "-0.667356 | \n", "-0.322124 | \n", "-0.089462 | \n", "0.181705 | \n", "1.784983 | \n", "2 | \n", "2 | \n", "... | \n", "0.084906 | \n", "-0.985736 | \n", "-0.130467 | \n", "-3.557893 | \n", "1.210687 | \n", "1.861884 | \n", "AEBBBBDABF | \n", "25.629415 | \n", "0 | \n", "2 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
699995 | \n", "1599995 | \n", "0.640110 | \n", "0.897808 | \n", "-0.523956 | \n", "1.563760 | \n", "-0.092281 | \n", "-0.610867 | \n", "0.535426 | \n", "0 | \n", "1 | \n", "... | \n", "2.604048 | \n", "1.122867 | \n", "0.518110 | \n", "1.243837 | \n", "0.575111 | \n", "0.076372 | \n", "BCBCEBHMCD | \n", "204.186539 | \n", "0 | \n", "0 | \n", "
699996 | \n", "1599996 | \n", "-0.191771 | \n", "-0.035246 | \n", "-0.118533 | \n", "0.584750 | \n", "2.126977 | \n", "0.568659 | \n", "-0.052663 | \n", "4 | \n", "3 | \n", "... | \n", "3.029857 | \n", "1.384682 | \n", "-1.135740 | \n", "2.982713 | \n", "-1.511760 | \n", "2.225218 | \n", "BAABCADQFC | \n", "-97.694591 | \n", "0 | \n", "2 | \n", "
699997 | \n", "1599997 | \n", "-0.331704 | \n", "-0.328845 | \n", "-1.185503 | \n", "1.022128 | \n", "-0.483099 | \n", "-0.107146 | \n", "-0.968281 | \n", "1 | \n", "1 | \n", "... | \n", "4.021273 | \n", "-1.845266 | \n", "1.096011 | \n", "-2.734508 | \n", "-4.885955 | \n", "-2.248739 | \n", "AAAJCBGQBA | \n", "130.622745 | \n", "1 | \n", "0 | \n", "
699998 | \n", "1599998 | \n", "-2.031073 | \n", "-1.238398 | \n", "0.964699 | \n", "-1.045950 | \n", "0.906064 | \n", "0.634301 | \n", "-0.707474 | \n", "5 | \n", "1 | \n", "... | \n", "1.453864 | \n", "-1.696606 | \n", "1.018995 | \n", "1.973697 | \n", "-0.353068 | \n", "-3.333449 | \n", "BCBBCABNDE | \n", "-364.625148 | \n", "0 | \n", "0 | \n", "
699999 | \n", "1599999 | \n", "-0.085906 | \n", "-0.002124 | \n", "2.227375 | \n", "0.217145 | \n", "3.179153 | \n", "-1.660188 | \n", "0.891989 | \n", "0 | \n", "3 | \n", "... | \n", "-3.549082 | \n", "-4.325318 | \n", "-5.017221 | \n", "0.251268 | \n", "-3.236026 | \n", "-0.362070 | \n", "AFBEBACHFF | \n", "-155.417342 | \n", "0 | \n", "1 | \n", "
700000 rows × 32 columns
\n", "\n", " | id | \n", "target | \n", "
---|---|---|
0 | \n", "900000 | \n", "0.5 | \n", "
1 | \n", "900001 | \n", "0.5 | \n", "
2 | \n", "900002 | \n", "0.5 | \n", "
3 | \n", "900003 | \n", "0.5 | \n", "
4 | \n", "900004 | \n", "0.5 | \n", "
... | \n", "... | \n", "... | \n", "
699995 | \n", "1599995 | \n", "0.5 | \n", "
699996 | \n", "1599996 | \n", "0.5 | \n", "
699997 | \n", "1599997 | \n", "0.5 | \n", "
699998 | \n", "1599998 | \n", "0.5 | \n", "
699999 | \n", "1599999 | \n", "0.5 | \n", "
700000 rows × 2 columns
\n", "\n", " | id | \n", "f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "... | \n", "f_21 | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "target | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "... | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "900000.000000 | \n", "
mean | \n", "449999.500000 | \n", "-0.000286 | \n", "0.001165 | \n", "0.001174 | \n", "-0.001368 | \n", "-0.000571 | \n", "0.000284 | \n", "-0.000709 | \n", "2.031460 | \n", "2.057998 | \n", "... | \n", "-0.156307 | \n", "-0.009273 | \n", "-0.369459 | \n", "-0.342738 | \n", "0.176549 | \n", "0.357591 | \n", "-0.380876 | \n", "0.345661 | \n", "1.002654 | \n", "0.486488 | \n", "
std | \n", "259807.765473 | \n", "0.998888 | \n", "0.999193 | \n", "1.000514 | \n", "1.000175 | \n", "1.000167 | \n", "0.999875 | \n", "0.999942 | \n", "1.656172 | \n", "1.590955 | \n", "... | \n", "2.484706 | \n", "2.450797 | \n", "2.453405 | \n", "2.386941 | \n", "2.416959 | \n", "2.476020 | \n", "238.773054 | \n", "0.475584 | \n", "0.818989 | \n", "0.499818 | \n", "
min | \n", "0.000000 | \n", "-4.599856 | \n", "-4.682199 | \n", "-4.642676 | \n", "-4.658816 | \n", "-4.748501 | \n", "-4.750214 | \n", "-4.842919 | \n", "0.000000 | \n", "0.000000 | \n", "... | \n", "-13.310146 | \n", "-11.853530 | \n", "-12.301097 | \n", "-11.416189 | \n", "-11.918306 | \n", "-14.300577 | \n", "-1229.753052 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "224999.750000 | \n", "-0.675490 | \n", "-0.675162 | \n", "-0.674369 | \n", "-0.676114 | \n", "-0.675909 | \n", "-0.673437 | \n", "-0.674876 | \n", "1.000000 | \n", "1.000000 | \n", "... | \n", "-1.820063 | \n", "-1.645585 | \n", "-2.019739 | \n", "-1.955956 | \n", "-1.440424 | \n", "-1.261598 | \n", "-159.427418 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
50% | \n", "449999.500000 | \n", "0.001144 | \n", "0.002014 | \n", "0.002218 | \n", "-0.002227 | \n", "-0.001662 | \n", "-0.000438 | \n", "-0.001492 | \n", "2.000000 | \n", "2.000000 | \n", "... | \n", "-0.152668 | \n", "0.030850 | \n", "-0.390966 | \n", "-0.340746 | \n", "0.160912 | \n", "0.404212 | \n", "-0.519808 | \n", "0.000000 | \n", "1.000000 | \n", "0.000000 | \n", "
75% | \n", "674999.250000 | \n", "0.674337 | \n", "0.675021 | \n", "0.677505 | \n", "0.672544 | \n", "0.673789 | \n", "0.675028 | \n", "0.674749 | \n", "3.000000 | \n", "3.000000 | \n", "... | \n", "1.507071 | \n", "1.661676 | \n", "1.255408 | \n", "1.266673 | \n", "1.795928 | \n", "2.028219 | \n", "158.987357 | \n", "1.000000 | \n", "2.000000 | \n", "1.000000 | \n", "
max | \n", "899999.000000 | \n", "4.749301 | \n", "4.815699 | \n", "4.961982 | \n", "4.454920 | \n", "4.948983 | \n", "4.971881 | \n", "4.822668 | \n", "15.000000 | \n", "16.000000 | \n", "... | \n", "14.455426 | \n", "11.344080 | \n", "12.247100 | \n", "12.389844 | \n", "12.529179 | \n", "12.913041 | \n", "1229.562577 | \n", "1.000000 | \n", "2.000000 | \n", "1.000000 | \n", "
8 rows × 32 columns
\n", "\n", " | f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "f_09 | \n", "... | \n", "f_20 | \n", "f_21 | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-1.373246 | \n", "0.238887 | \n", "-0.243376 | \n", "0.567405 | \n", "-0.647715 | \n", "0.839326 | \n", "0.113133 | \n", "1 | \n", "5 | \n", "1 | \n", "... | \n", "-0.919717 | \n", "3.058541 | \n", "-2.540739 | \n", "0.766952 | \n", "-2.730628 | \n", "-0.208177 | \n", "1.363402 | \n", "67.609153 | \n", "0 | \n", "0 | \n", "
1 | \n", "1.697021 | \n", "-1.710322 | \n", "-2.230332 | \n", "-0.545661 | \n", "1.113173 | \n", "-1.552175 | \n", "0.447825 | \n", "1 | \n", "3 | \n", "4 | \n", "... | \n", "-1.075434 | \n", "2.179050 | \n", "2.278315 | \n", "-0.633658 | \n", "-1.217077 | \n", "-3.782194 | \n", "-0.058316 | \n", "377.096415 | \n", "0 | \n", "0 | \n", "
2 | \n", "1.681726 | \n", "0.616746 | \n", "-1.027689 | \n", "0.810492 | \n", "-0.609086 | \n", "0.113965 | \n", "-0.708660 | \n", "1 | \n", "0 | \n", "2 | \n", "... | \n", "-3.485342 | \n", "-0.784235 | \n", "-1.385775 | \n", "-0.520558 | \n", "-0.009121 | \n", "2.788536 | \n", "-3.703488 | \n", "-195.599702 | \n", "0 | \n", "2 | \n", "
3 | \n", "-0.118172 | \n", "-0.587835 | \n", "-0.804638 | \n", "2.086822 | \n", "0.371005 | \n", "-0.128831 | \n", "-0.282575 | \n", "3 | \n", "2 | \n", "1 | \n", "... | \n", "-2.100177 | \n", "-2.343819 | \n", "0.572594 | \n", "-1.653213 | \n", "1.686035 | \n", "-2.533098 | \n", "-0.608601 | \n", "210.826205 | \n", "0 | \n", "0 | \n", "
4 | \n", "1.148481 | \n", "-0.176567 | \n", "-0.664871 | \n", "-1.101343 | \n", "0.467875 | \n", "0.500117 | \n", "0.407515 | \n", "3 | \n", "3 | \n", "0 | \n", "... | \n", "0.605033 | \n", "1.133665 | \n", "-3.912929 | \n", "-1.430366 | \n", "2.127649 | \n", "-3.306784 | \n", "4.371371 | \n", "-217.211798 | \n", "0 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
699995 | \n", "0.640110 | \n", "0.897808 | \n", "-0.523956 | \n", "1.563760 | \n", "-0.092281 | \n", "-0.610867 | \n", "0.535426 | \n", "0 | \n", "1 | \n", "6 | \n", "... | \n", "-2.185190 | \n", "2.604048 | \n", "1.122867 | \n", "0.518110 | \n", "1.243837 | \n", "0.575111 | \n", "0.076372 | \n", "204.186539 | \n", "0 | \n", "0 | \n", "
699996 | \n", "-0.191771 | \n", "-0.035246 | \n", "-0.118533 | \n", "0.584750 | \n", "2.126977 | \n", "0.568659 | \n", "-0.052663 | \n", "4 | \n", "3 | \n", "4 | \n", "... | \n", "-0.239552 | \n", "3.029857 | \n", "1.384682 | \n", "-1.135740 | \n", "2.982713 | \n", "-1.511760 | \n", "2.225218 | \n", "-97.694591 | \n", "0 | \n", "2 | \n", "
699997 | \n", "-0.331704 | \n", "-0.328845 | \n", "-1.185503 | \n", "1.022128 | \n", "-0.483099 | \n", "-0.107146 | \n", "-0.968281 | \n", "1 | \n", "1 | \n", "2 | \n", "... | \n", "-0.922626 | \n", "4.021273 | \n", "-1.845266 | \n", "1.096011 | \n", "-2.734508 | \n", "-4.885955 | \n", "-2.248739 | \n", "130.622745 | \n", "1 | \n", "0 | \n", "
699998 | \n", "-2.031073 | \n", "-1.238398 | \n", "0.964699 | \n", "-1.045950 | \n", "0.906064 | \n", "0.634301 | \n", "-0.707474 | \n", "5 | \n", "1 | \n", "1 | \n", "... | \n", "-3.079996 | \n", "1.453864 | \n", "-1.696606 | \n", "1.018995 | \n", "1.973697 | \n", "-0.353068 | \n", "-3.333449 | \n", "-364.625148 | \n", "0 | \n", "0 | \n", "
699999 | \n", "-0.085906 | \n", "-0.002124 | \n", "2.227375 | \n", "0.217145 | \n", "3.179153 | \n", "-1.660188 | \n", "0.891989 | \n", "0 | \n", "3 | \n", "4 | \n", "... | \n", "-2.128546 | \n", "-3.549082 | \n", "-4.325318 | \n", "-5.017221 | \n", "0.251268 | \n", "-3.236026 | \n", "-0.362070 | \n", "-155.417342 | \n", "0 | \n", "1 | \n", "
1600000 rows × 30 columns
\n", "\n", " | f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "f_09 | \n", "... | \n", "f_20 | \n", "f_21 | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-1.373246 | \n", "0.238887 | \n", "-0.243376 | \n", "0.567405 | \n", "-0.647715 | \n", "0.839326 | \n", "0.113133 | \n", "1 | \n", "5 | \n", "1 | \n", "... | \n", "-0.919717 | \n", "3.058541 | \n", "-2.540739 | \n", "0.766952 | \n", "-2.730628 | \n", "-0.208177 | \n", "1.363402 | \n", "67.609153 | \n", "0 | \n", "0 | \n", "
1 | \n", "1.697021 | \n", "-1.710322 | \n", "-2.230332 | \n", "-0.545661 | \n", "1.113173 | \n", "-1.552175 | \n", "0.447825 | \n", "1 | \n", "3 | \n", "4 | \n", "... | \n", "-1.075434 | \n", "2.179050 | \n", "2.278315 | \n", "-0.633658 | \n", "-1.217077 | \n", "-3.782194 | \n", "-0.058316 | \n", "377.096415 | \n", "0 | \n", "0 | \n", "
2 | \n", "1.681726 | \n", "0.616746 | \n", "-1.027689 | \n", "0.810492 | \n", "-0.609086 | \n", "0.113965 | \n", "-0.708660 | \n", "1 | \n", "0 | \n", "2 | \n", "... | \n", "-3.485342 | \n", "-0.784235 | \n", "-1.385775 | \n", "-0.520558 | \n", "-0.009121 | \n", "2.788536 | \n", "-3.703488 | \n", "-195.599702 | \n", "0 | \n", "2 | \n", "
3 | \n", "-0.118172 | \n", "-0.587835 | \n", "-0.804638 | \n", "2.086822 | \n", "0.371005 | \n", "-0.128831 | \n", "-0.282575 | \n", "3 | \n", "2 | \n", "1 | \n", "... | \n", "-2.100177 | \n", "-2.343819 | \n", "0.572594 | \n", "-1.653213 | \n", "1.686035 | \n", "-2.533098 | \n", "-0.608601 | \n", "210.826205 | \n", "0 | \n", "0 | \n", "
4 | \n", "1.148481 | \n", "-0.176567 | \n", "-0.664871 | \n", "-1.101343 | \n", "0.467875 | \n", "0.500117 | \n", "0.407515 | \n", "3 | \n", "3 | \n", "0 | \n", "... | \n", "0.605033 | \n", "1.133665 | \n", "-3.912929 | \n", "-1.430366 | \n", "2.127649 | \n", "-3.306784 | \n", "4.371371 | \n", "-217.211798 | \n", "0 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
699995 | \n", "0.640110 | \n", "0.897808 | \n", "-0.523956 | \n", "1.563760 | \n", "-0.092281 | \n", "-0.610867 | \n", "0.535426 | \n", "0 | \n", "1 | \n", "6 | \n", "... | \n", "-2.185190 | \n", "2.604048 | \n", "1.122867 | \n", "0.518110 | \n", "1.243837 | \n", "0.575111 | \n", "0.076372 | \n", "204.186539 | \n", "0 | \n", "0 | \n", "
699996 | \n", "-0.191771 | \n", "-0.035246 | \n", "-0.118533 | \n", "0.584750 | \n", "2.126977 | \n", "0.568659 | \n", "-0.052663 | \n", "4 | \n", "3 | \n", "4 | \n", "... | \n", "-0.239552 | \n", "3.029857 | \n", "1.384682 | \n", "-1.135740 | \n", "2.982713 | \n", "-1.511760 | \n", "2.225218 | \n", "-97.694591 | \n", "0 | \n", "2 | \n", "
699997 | \n", "-0.331704 | \n", "-0.328845 | \n", "-1.185503 | \n", "1.022128 | \n", "-0.483099 | \n", "-0.107146 | \n", "-0.968281 | \n", "1 | \n", "1 | \n", "2 | \n", "... | \n", "-0.922626 | \n", "4.021273 | \n", "-1.845266 | \n", "1.096011 | \n", "-2.734508 | \n", "-4.885955 | \n", "-2.248739 | \n", "130.622745 | \n", "1 | \n", "0 | \n", "
699998 | \n", "-2.031073 | \n", "-1.238398 | \n", "0.964699 | \n", "-1.045950 | \n", "0.906064 | \n", "0.634301 | \n", "-0.707474 | \n", "5 | \n", "1 | \n", "1 | \n", "... | \n", "-3.079996 | \n", "1.453864 | \n", "-1.696606 | \n", "1.018995 | \n", "1.973697 | \n", "-0.353068 | \n", "-3.333449 | \n", "-364.625148 | \n", "0 | \n", "0 | \n", "
699999 | \n", "-0.085906 | \n", "-0.002124 | \n", "2.227375 | \n", "0.217145 | \n", "3.179153 | \n", "-1.660188 | \n", "0.891989 | \n", "0 | \n", "3 | \n", "4 | \n", "... | \n", "-2.128546 | \n", "-3.549082 | \n", "-4.325318 | \n", "-5.017221 | \n", "0.251268 | \n", "-3.236026 | \n", "-0.362070 | \n", "-155.417342 | \n", "0 | \n", "1 | \n", "
1600000 rows × 30 columns
\n", "\n", " | f_00 | \n", "f_01 | \n", "f_02 | \n", "f_03 | \n", "f_04 | \n", "f_05 | \n", "f_06 | \n", "f_07 | \n", "f_08 | \n", "f_09 | \n", "... | \n", "f_20 | \n", "f_21 | \n", "f_22 | \n", "f_23 | \n", "f_24 | \n", "f_25 | \n", "f_26 | \n", "f_28 | \n", "f_29 | \n", "f_30 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.315238 | \n", "0.530025 | \n", "0.458038 | \n", "0.546749 | \n", "0.422871 | \n", "0.591372 | \n", "0.512752 | \n", "0.0625 | \n", "0.3125 | \n", "0.0625 | \n", "... | \n", "0.454761 | \n", "0.589532 | \n", "0.401455 | \n", "0.532343 | \n", "0.375916 | \n", "0.507106 | \n", "0.575593 | \n", "0.527530 | \n", "0.0 | \n", "0.0 | \n", "
1 | \n", "0.609890 | \n", "0.329868 | \n", "0.251164 | \n", "0.430304 | \n", "0.604453 | \n", "0.354899 | \n", "0.547380 | \n", "0.0625 | \n", "0.1875 | \n", "0.2500 | \n", "... | \n", "0.447912 | \n", "0.557856 | \n", "0.609194 | \n", "0.475287 | \n", "0.438386 | \n", "0.368803 | \n", "0.523351 | \n", "0.653373 | \n", "0.0 | \n", "0.0 | \n", "
2 | \n", "0.608423 | \n", "0.568826 | \n", "0.376379 | \n", "0.572180 | \n", "0.426854 | \n", "0.519648 | \n", "0.427730 | \n", "0.0625 | \n", "0.0000 | \n", "0.1250 | \n", "... | \n", "0.341903 | \n", "0.451131 | \n", "0.451243 | \n", "0.479894 | \n", "0.488244 | \n", "0.623069 | \n", "0.389404 | \n", "0.420505 | \n", "0.0 | \n", "1.0 | \n", "
3 | \n", "0.435687 | \n", "0.445132 | \n", "0.399602 | \n", "0.705705 | \n", "0.527921 | \n", "0.495640 | \n", "0.471812 | \n", "0.1875 | \n", "0.1250 | \n", "0.0625 | \n", "... | \n", "0.402835 | \n", "0.394961 | \n", "0.535664 | \n", "0.433754 | \n", "0.558210 | \n", "0.417139 | \n", "0.503130 | \n", "0.585764 | \n", "0.0 | \n", "0.0 | \n", "
4 | \n", "0.557247 | \n", "0.487364 | \n", "0.414154 | \n", "0.372170 | \n", "0.537910 | \n", "0.557831 | \n", "0.543209 | \n", "0.1875 | \n", "0.1875 | \n", "0.0000 | \n", "... | \n", "0.521833 | \n", "0.520206 | \n", "0.342303 | \n", "0.442832 | \n", "0.576437 | \n", "0.387200 | \n", "0.686125 | \n", "0.411717 | \n", "0.0 | \n", "0.5 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
699995 | \n", "0.508459 | \n", "0.597687 | \n", "0.428825 | \n", "0.650984 | \n", "0.480147 | \n", "0.447976 | \n", "0.556443 | \n", "0.0000 | \n", "0.0625 | \n", "0.3750 | \n", "... | \n", "0.399095 | \n", "0.573163 | \n", "0.559385 | \n", "0.522206 | \n", "0.539958 | \n", "0.537416 | \n", "0.528300 | \n", "0.583064 | \n", "0.0 | \n", "0.0 | \n", "
699996 | \n", "0.428624 | \n", "0.501875 | \n", "0.471036 | \n", "0.548564 | \n", "0.708996 | \n", "0.564608 | \n", "0.495599 | \n", "0.2500 | \n", "0.1875 | \n", "0.2500 | \n", "... | \n", "0.484681 | \n", "0.588499 | \n", "0.570671 | \n", "0.454834 | \n", "0.611729 | \n", "0.456661 | \n", "0.607262 | \n", "0.460314 | \n", "0.0 | \n", "1.0 | \n", "
699997 | \n", "0.415195 | \n", "0.471727 | \n", "0.359948 | \n", "0.594321 | \n", "0.439846 | \n", "0.497784 | \n", "0.400869 | \n", "0.0625 | \n", "0.0625 | \n", "0.1250 | \n", "... | \n", "0.454633 | \n", "0.624205 | \n", "0.431435 | \n", "0.545747 | \n", "0.375756 | \n", "0.326091 | \n", "0.442861 | \n", "0.553152 | \n", "1.0 | \n", "0.0 | \n", "
699998 | \n", "0.252107 | \n", "0.378328 | \n", "0.583818 | \n", "0.377965 | \n", "0.583096 | \n", "0.571099 | \n", "0.427852 | \n", "0.3125 | \n", "0.0625 | \n", "0.0625 | \n", "... | \n", "0.359734 | \n", "0.531738 | \n", "0.437844 | \n", "0.542610 | \n", "0.570083 | \n", "0.501499 | \n", "0.403001 | \n", "0.351776 | \n", "0.0 | \n", "0.0 | \n", "
699999 | \n", "0.438784 | \n", "0.505277 | \n", "0.715283 | \n", "0.510106 | \n", "0.817496 | \n", "0.344219 | \n", "0.593333 | \n", "0.0000 | \n", "0.1875 | \n", "0.2500 | \n", "... | \n", "0.401587 | \n", "0.351553 | \n", "0.324525 | \n", "0.296717 | \n", "0.498991 | \n", "0.389938 | \n", "0.512189 | \n", "0.436843 | \n", "0.0 | \n", "0.5 | \n", "
1600000 rows × 30 columns
\n", "\n", " | id | \n", "target | \n", "
---|---|---|
0 | \n", "900000 | \n", "0 | \n", "
1 | \n", "900001 | \n", "1 | \n", "
2 | \n", "900002 | \n", "0 | \n", "
3 | \n", "900003 | \n", "0 | \n", "
4 | \n", "900004 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "
699995 | \n", "1599995 | \n", "1 | \n", "
699996 | \n", "1599996 | \n", "1 | \n", "
699997 | \n", "1599997 | \n", "1 | \n", "
699998 | \n", "1599998 | \n", "0 | \n", "
699999 | \n", "1599999 | \n", "0 | \n", "
700000 rows × 2 columns
\n", "