diff --git a/Jenkinsfile b/Jenkinsfile new file mode 100644 index 0000000..e7d04ab --- /dev/null +++ b/Jenkinsfile @@ -0,0 +1,10 @@ +pipeline { + agent any + stages { + stage('Stage 1') { + steps { + echo 'Hello world!' + } + } + } +} diff --git a/download_data.ipynb b/download_data.ipynb index b3764bc..2406c07 100644 --- a/download_data.ipynb +++ b/download_data.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 12, + "execution_count": 28, "id": "5e2107a5", "metadata": {}, "outputs": [], @@ -12,7 +12,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 29, "id": "bcc889e5", "metadata": {}, "outputs": [ @@ -21,12 +21,12 @@ "output_type": "stream", "text": [ "Requirement already satisfied: kaggle in /home/students/s444463/.local/lib/python3.8/site-packages (1.5.12)\n", - "Requirement already satisfied: python-slugify in /home/students/s444463/.local/lib/python3.8/site-packages (from kaggle) (6.1.1)\n", - "Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from kaggle) (2019.11.28)\n", - "Requirement already satisfied: urllib3 in /usr/lib/python3/dist-packages (from kaggle) (1.25.8)\n", - "Requirement already satisfied: requests in /usr/lib/python3/dist-packages (from kaggle) (2.22.0)\n", - "Requirement already satisfied: six>=1.10 in /usr/lib/python3/dist-packages (from kaggle) (1.14.0)\n", "Requirement already satisfied: tqdm in /home/students/s444463/.local/lib/python3.8/site-packages (from kaggle) (4.63.0)\n", + "Requirement already satisfied: urllib3 in /usr/lib/python3/dist-packages (from kaggle) (1.25.8)\n", + "Requirement already satisfied: six>=1.10 in /usr/lib/python3/dist-packages (from kaggle) (1.14.0)\n", + "Requirement already satisfied: certifi in /usr/lib/python3/dist-packages (from kaggle) (2019.11.28)\n", + "Requirement already satisfied: requests in /usr/lib/python3/dist-packages (from kaggle) (2.22.0)\n", + "Requirement already satisfied: python-slugify in /home/students/s444463/.local/lib/python3.8/site-packages (from kaggle) (6.1.1)\n", "Requirement already satisfied: python-dateutil in /usr/lib/python3/dist-packages (from kaggle) (2.7.3)\n", "Requirement already satisfied: text-unidecode>=1.3 in /home/students/s444463/.local/lib/python3.8/site-packages (from python-slugify->kaggle) (1.3)\n", "\u001b[33mWARNING: You are using pip version 21.2.4; however, version 22.0.4 is available.\n", @@ -48,7 +48,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 30, "id": "02a4034f", "metadata": {}, "outputs": [ @@ -68,7 +68,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 31, "id": "5035aef0", "metadata": {}, "outputs": [ @@ -86,7 +86,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 32, "id": "14344d2f", "metadata": {}, "outputs": [ @@ -97,13 +97,13 @@ "Requirement already satisfied: seaborn in /home/students/s444463/.local/lib/python3.8/site-packages (0.11.2)\n", "Requirement already satisfied: numpy>=1.15 in /usr/lib/python3/dist-packages (from seaborn) (1.17.4)\n", "Requirement already satisfied: scipy>=1.0 in /usr/lib/python3/dist-packages (from seaborn) (1.3.3)\n", - "Requirement already satisfied: pandas>=0.23 in /usr/lib/python3/dist-packages (from seaborn) (0.25.3)\n", "Requirement already satisfied: matplotlib>=2.2 in /home/students/s444463/.local/lib/python3.8/site-packages (from seaborn) (3.4.3)\n", + "Requirement already satisfied: pandas>=0.23 in /usr/lib/python3/dist-packages (from seaborn) (0.25.3)\n", "Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.8/dist-packages (from matplotlib>=2.2->seaborn) (8.3.2)\n", - "Requirement already satisfied: python-dateutil>=2.7 in /usr/lib/python3/dist-packages (from matplotlib>=2.2->seaborn) (2.7.3)\n", - "Requirement already satisfied: cycler>=0.10 in /home/students/s444463/.local/lib/python3.8/site-packages (from matplotlib>=2.2->seaborn) (0.10.0)\n", "Requirement already satisfied: pyparsing>=2.2.1 in /usr/local/lib/python3.8/dist-packages (from matplotlib>=2.2->seaborn) (2.4.7)\n", + "Requirement already satisfied: cycler>=0.10 in /home/students/s444463/.local/lib/python3.8/site-packages (from matplotlib>=2.2->seaborn) (0.10.0)\n", "Requirement already satisfied: kiwisolver>=1.0.1 in /home/students/s444463/.local/lib/python3.8/site-packages (from matplotlib>=2.2->seaborn) (1.3.2)\n", + "Requirement already satisfied: python-dateutil>=2.7 in /usr/lib/python3/dist-packages (from matplotlib>=2.2->seaborn) (2.7.3)\n", "Requirement already satisfied: six in /usr/lib/python3/dist-packages (from cycler>=0.10->matplotlib>=2.2->seaborn) (1.14.0)\n", "\u001b[33mWARNING: You are using pip version 21.2.4; however, version 22.0.4 is available.\n", "You should consider upgrading via the '/usr/bin/python3 -m pip install --upgrade pip' command.\u001b[0m\n" @@ -116,7 +116,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 33, "id": "0f5ebfab", "metadata": {}, "outputs": [ @@ -519,7 +519,7 @@ "[17880 rows x 18 columns]" ] }, - "execution_count": 17, + "execution_count": 33, "metadata": {}, "output_type": "execute_result" } @@ -532,7 +532,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 34, "id": "edbf49da", "metadata": {}, "outputs": [ @@ -551,7 +551,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 35, "id": "e60b3f32", "metadata": {}, "outputs": [ @@ -572,7 +572,7 @@ "Name: department, Length: 1337, dtype: int64" ] }, - "execution_count": 19, + "execution_count": 35, "metadata": {}, "output_type": "execute_result" } @@ -583,10 +583,414 @@ }, { "cell_type": "code", - "execution_count": null, - "id": "2612d68b", + "execution_count": 36, + "id": "ddb2fc38", "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | job_id | \n", + "title | \n", + "location | \n", + "department | \n", + "salary_range | \n", + "company_profile | \n", + "description | \n", + "requirements | \n", + "benefits | \n", + "telecommuting | \n", + "has_company_logo | \n", + "has_questions | \n", + "employment_type | \n", + "required_experience | \n", + "required_education | \n", + "industry | \n", + "function | \n", + "fraudulent | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "1 | \n", + "Marketing Intern | \n", + "US, NY, New York | \n", + "Marketing | \n", + "\n", + " | We're Food52, and we've created a groundbreaki... | \n", + "Food52, a fast-growing, James Beard Award-winn... | \n", + "Experience with content management systems a m... | \n", + "\n", + " | 0 | \n", + "1 | \n", + "0 | \n", + "Other | \n", + "Internship | \n", + "\n", + " | \n", + " | Marketing | \n", + "0 | \n", + "
1 | \n", + "2 | \n", + "Customer Service - Cloud Video Production | \n", + "NZ, , Auckland | \n", + "Success | \n", + "\n", + " | 90 Seconds, the worlds Cloud Video Production ... | \n", + "Organised - Focused - Vibrant - Awesome!Do you... | \n", + "What we expect from you:Your key responsibilit... | \n", + "What you will get from usThrough being part of... | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "Full-time | \n", + "Not Applicable | \n", + "\n", + " | Marketing and Advertising | \n", + "Customer Service | \n", + "0 | \n", + "
2 | \n", + "3 | \n", + "Commissioning Machinery Assistant (CMA) | \n", + "US, IA, Wever | \n", + "\n", + " | \n", + " | Valor Services provides Workforce Solutions th... | \n", + "Our client, located in Houston, is actively se... | \n", + "Implement pre-commissioning and commissioning ... | \n", + "\n", + " | 0 | \n", + "1 | \n", + "0 | \n", + "\n", + " | \n", + " | \n", + " | \n", + " | \n", + " | 0 | \n", + "
3 | \n", + "4 | \n", + "Account Executive - Washington DC | \n", + "US, DC, Washington | \n", + "Sales | \n", + "\n", + " | Our passion for improving quality of life thro... | \n", + "THE COMPANY: ESRI – Environmental Systems Rese... | \n", + "EDUCATION: Bachelor’s or Master’s in GIS, busi... | \n", + "Our culture is anything but corporate—we have ... | \n", + "0 | \n", + "1 | \n", + "0 | \n", + "Full-time | \n", + "Mid-Senior level | \n", + "Bachelor's Degree | \n", + "Computer Software | \n", + "Sales | \n", + "0 | \n", + "
4 | \n", + "5 | \n", + "Bill Review Manager | \n", + "US, FL, Fort Worth | \n", + "\n", + " | \n", + " | SpotSource Solutions LLC is a Global Human Cap... | \n", + "JOB TITLE: Itemization Review ManagerLOCATION:... | \n", + "QUALIFICATIONS:RN license in the State of Texa... | \n", + "Full Benefits Offered | \n", + "0 | \n", + "1 | \n", + "1 | \n", + "Full-time | \n", + "Mid-Senior level | \n", + "Bachelor's Degree | \n", + "Hospital & Health Care | \n", + "Health Care Provider | \n", + "0 | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
17875 | \n", + "17876 | \n", + "Account Director - Distribution | \n", + "CA, ON, Toronto | \n", + "Sales | \n", + "\n", + " | Vend is looking for some awesome new talent to... | \n", + "Just in case this is the first time you’ve vis... | \n", + "To ace this role you:Will eat comprehensive St... | \n", + "What can you expect from us?We have an open cu... | \n", + "0 | \n", + "1 | \n", + "1 | \n", + "Full-time | \n", + "Mid-Senior level | \n", + "\n", + " | Computer Software | \n", + "Sales | \n", + "0 | \n", + "
17876 | \n", + "17877 | \n", + "Payroll Accountant | \n", + "US, PA, Philadelphia | \n", + "Accounting | \n", + "\n", + " | WebLinc is the e-commerce platform and service... | \n", + "The Payroll Accountant will focus primarily on... | \n", + "- B.A. or B.S. in Accounting- Desire to have f... | \n", + "Health & WellnessMedical planPrescription ... | \n", + "0 | \n", + "1 | \n", + "1 | \n", + "Full-time | \n", + "Mid-Senior level | \n", + "Bachelor's Degree | \n", + "Internet | \n", + "Accounting/Auditing | \n", + "0 | \n", + "
17877 | \n", + "17878 | \n", + "Project Cost Control Staff Engineer - Cost Con... | \n", + "US, TX, Houston | \n", + "\n", + " | \n", + " | We Provide Full Time Permanent Positions for m... | \n", + "Experienced Project Cost Control Staff Enginee... | \n", + "At least 12 years professional experience.Abil... | \n", + "\n", + " | 0 | \n", + "0 | \n", + "0 | \n", + "Full-time | \n", + "\n", + " | \n", + " | \n", + " | \n", + " | 0 | \n", + "
17878 | \n", + "17879 | \n", + "Graphic Designer | \n", + "NG, LA, Lagos | \n", + "\n", + " | \n", + " | \n", + " | Nemsia Studios is looking for an experienced v... | \n", + "1. Must be fluent in the latest versions of Co... | \n", + "Competitive salary (compensation will be based... | \n", + "0 | \n", + "0 | \n", + "1 | \n", + "Contract | \n", + "Not Applicable | \n", + "Professional | \n", + "Graphic Design | \n", + "Design | \n", + "0 | \n", + "
17879 | \n", + "17880 | \n", + "Web Application Developers | \n", + "NZ, N, Wellington | \n", + "Engineering | \n", + "\n", + " | Vend is looking for some awesome new talent to... | \n", + "Who are we?Vend is an award winning web based ... | \n", + "We want to hear from you if:You have an in-dep... | \n", + "\n", + " | 0 | \n", + "1 | \n", + "1 | \n", + "Full-time | \n", + "Mid-Senior level | \n", + "\n", + " | Computer Software | \n", + "Engineering | \n", + "0 | \n", + "
17880 rows × 18 columns
\n", + "