{ "cells": [ { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Y8jA9U3pdddm", "outputId": "ccf507aa-2ada-4d1d-a577-c2b0ac8efb06" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount(\"/content/drive\", force_remount=True).\n" ] } ], "source": [ "# Mount Google Drive (Colab only) so files under /content/drive can be read.\n", "from google.colab import drive\n", "drive.mount('/content/drive')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "sOLAMK6M0u0n" }, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "XGI8jtg00NSX" }, "outputs": [], "source": [ "# Path of the merged CSV on the mounted Drive; change it here to load another copy.\n", "DATA_PATH = '/content/drive/MyDrive/Research Dataset/processed_data/Added_Target/FullyMerged.csv'\n", "Data = pd.read_csv(DATA_PATH)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "B31lRinc03xl" }, "outputs": [], "source": [ "# Remove the 'Unnamed: 0' column when it is present. errors='ignore' keeps this\n", "# cell safe to re-run after the column has already been dropped (no KeyError).\n", "Data = Data.drop(columns=['Unnamed: 0'], errors='ignore')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "6Q8Qx4dF07mF" }, "outputs": [], "source": [ "# Columns whose text is concatenated into the single 'ALL' field.\n", "TEXT_COLUMNS = ['skills', 'edu_1', 'edu_2', 'edu_3', 'org_1', 'org_2', 'org_3', 'org_4']\n", "\n", "# str.join raises TypeError on NaN or non-string cells, so replace missing values\n", "# with '' and cast to str before joining each row with single spaces.\n", "Data['ALL'] = Data[TEXT_COLUMNS].fillna('').astype(str).agg(' '.join, axis=1)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 424 }, "id": "vz-Rh6M61BjU", "outputId": "e22dfce6-ba88-46fc-d728-8cc247626c6f" }, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ " Target ALL\n", "0 Software Engineer Java Android Development PHP HTML C Cascading ...\n", "1 Software Engineer ...\n", "2 Software Engineer JavaScript Reactjs MySQL ObjectOriented Progra...\n", "3 Software Engineer Java JavaScript PHP HTML Cascading Style Sheet...\n", "4 Software Engineer Java Android Development C Communication HTML ...\n", "... ... 
...\n", "4571 Data Science SQL Git Machine Learning C Deep Learning Pytho...\n", "4572 Data Science Python Programming Language Bootstrap Machine ...\n", "4573 Data Science Java C JavaScript PHP MySQL Cascading Style Sh...\n", "4574 Data Science Python Programming Language HTML Machine Learn...\n", "4575 Data Science SQL Data Analysis Microsoft Excel Deep Learnin...\n", "\n", "[4576 rows x 2 columns]" ], "text/html": [ "\n", "
\n", " | Target | \n", "ALL | \n", "
---|---|---|
0 | \n", "Software Engineer | \n", "Java Android Development PHP HTML C Cascading ... | \n", "
1 | \n", "Software Engineer | \n", "... | \n", "
2 | \n", "Software Engineer | \n", "JavaScript Reactjs MySQL ObjectOriented Progra... | \n", "
3 | \n", "Software Engineer | \n", "Java JavaScript PHP HTML Cascading Style Sheet... | \n", "
4 | \n", "Software Engineer | \n", "Java Android Development C Communication HTML ... | \n", "
... | \n", "... | \n", "... | \n", "
4571 | \n", "Data Science | \n", "SQL Git Machine Learning C Deep Learning Pytho... | \n", "
4572 | \n", "Data Science | \n", "Python Programming Language Bootstrap Machine ... | \n", "
4573 | \n", "Data Science | \n", "Java C JavaScript PHP MySQL Cascading Style Sh... | \n", "
4574 | \n", "Data Science | \n", "Python Programming Language HTML Machine Learn... | \n", "
4575 | \n", "Data Science | \n", "SQL Data Analysis Microsoft Excel Deep Learnin... | \n", "
4576 rows × 2 columns
\n", "\n", " | Target | \n", "ALL | \n", "Target_NO | \n", "
---|---|---|---|
0 | \n", "Software Engineer | \n", "Java Android Development PHP HTML C Cascading ... | \n", "9 | \n", "
1 | \n", "Software Engineer | \n", "... | \n", "9 | \n", "
2 | \n", "Software Engineer | \n", "JavaScript Reactjs MySQL ObjectOriented Progra... | \n", "9 | \n", "
3 | \n", "Software Engineer | \n", "Java JavaScript PHP HTML Cascading Style Sheet... | \n", "9 | \n", "
4 | \n", "Software Engineer | \n", "Java Android Development C Communication HTML ... | \n", "9 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
4571 | \n", "Data Science | \n", "SQL Git Machine Learning C Deep Learning Pytho... | \n", "3 | \n", "
4572 | \n", "Data Science | \n", "Python Programming Language Bootstrap Machine ... | \n", "3 | \n", "
4573 | \n", "Data Science | \n", "Java C JavaScript PHP MySQL Cascading Style Sh... | \n", "3 | \n", "
4574 | \n", "Data Science | \n", "Python Programming Language HTML Machine Learn... | \n", "3 | \n", "
4575 | \n", "Data Science | \n", "SQL Data Analysis Microsoft Excel Deep Learnin... | \n", "3 | \n", "
4576 rows × 3 columns
\n", "\n", " | Target | \n", "ALL | \n", "Target_NO | \n", "
---|---|---|---|
0 | \n", "Software Engineer | \n", "Java Android Development PHP HTML C Cascading ... | \n", "9 | \n", "
1 | \n", "Software Engineer | \n", "... | \n", "9 | \n", "
2 | \n", "Software Engineer | \n", "JavaScript Reactjs MySQL ObjectOriented Progra... | \n", "9 | \n", "
3 | \n", "Software Engineer | \n", "Java JavaScript PHP HTML Cascading Style Sheet... | \n", "9 | \n", "
4 | \n", "Software Engineer | \n", "Java Android Development C Communication HTML ... | \n", "9 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
4571 | \n", "Data Science | \n", "SQL Git Machine Learning C Deep Learning Pytho... | \n", "3 | \n", "
4572 | \n", "Data Science | \n", "Python Programming Language Bootstrap Machine ... | \n", "3 | \n", "
4573 | \n", "Data Science | \n", "Java C JavaScript PHP MySQL Cascading Style Sh... | \n", "3 | \n", "
4574 | \n", "Data Science | \n", "Python Programming Language HTML Machine Learn... | \n", "3 | \n", "
4575 | \n", "Data Science | \n", "SQL Data Analysis Microsoft Excel Deep Learnin... | \n", "3 | \n", "
4576 rows × 3 columns
\n", "