{ "cells": [ { "cell_type": "markdown", "id": "32e38283", "metadata": {}, "source": [ "# Part 1: exploring and correcting a dataset" ] }, { "cell_type": "code", "execution_count": 2, "id": "565831c6", "metadata": {}, "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 3, "id": "0d1f0a19", "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", " | customerID | \n", "gender | \n", "SeniorCitizen | \n", "Partner | \n", "Dependents | \n", "tenure | \n", "PhoneService | \n", "MultipleLines | \n", "InternetService | \n", "OnlineSecurity | \n", "... | \n", "DeviceProtection | \n", "TechSupport | \n", "StreamingTV | \n", "StreamingMovies | \n", "Contract | \n", "PaperlessBilling | \n", "PaymentMethod | \n", "MonthlyCharges | \n", "TotalCharges | \n", "Churn | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "7590-VHVEG | \n", "Female | \n", "0 | \n", "Yes | \n", "No | \n", "1 | \n", "No | \n", "No phone service | \n", "DSL | \n", "No | \n", "... | \n", "No | \n", "No | \n", "No | \n", "No | \n", "Month-to-month | \n", "Yes | \n", "Electronic check | \n", "29.85 | \n", "29.85 | \n", "No | \n", "
1 | \n", "5575-GNVDE | \n", "Male | \n", "0 | \n", "No | \n", "No | \n", "34 | \n", "Yes | \n", "No | \n", "DSL | \n", "Yes | \n", "... | \n", "Yes | \n", "No | \n", "No | \n", "No | \n", "One year | \n", "No | \n", "Mailed check | \n", "56.95 | \n", "1889.50 | \n", "No | \n", "
2 | \n", "3668-QPYBK | \n", "Male | \n", "0 | \n", "No | \n", "No | \n", "2 | \n", "Yes | \n", "No | \n", "DSL | \n", "Yes | \n", "... | \n", "No | \n", "No | \n", "No | \n", "No | \n", "Month-to-month | \n", "Yes | \n", "Mailed check | \n", "53.85 | \n", "108.15 | \n", "Yes | \n", "
3 | \n", "7795-CFOCW | \n", "Male | \n", "0 | \n", "No | \n", "No | \n", "45 | \n", "No | \n", "No phone service | \n", "DSL | \n", "Yes | \n", "... | \n", "Yes | \n", "Yes | \n", "No | \n", "No | \n", "One year | \n", "No | \n", "Bank transfer (automatic) | \n", "42.30 | \n", "1840.75 | \n", "No | \n", "
4 | \n", "9237-HQITU | \n", "Female | \n", "0 | \n", "No | \n", "No | \n", "2 | \n", "Yes | \n", "No | \n", "Fiber optic | \n", "No | \n", "... | \n", "No | \n", "No | \n", "No | \n", "No | \n", "Month-to-month | \n", "Yes | \n", "Electronic check | \n", "70.70 | \n", "151.65 | \n", "Yes | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
7038 | \n", "6840-RESVB | \n", "Male | \n", "0 | \n", "Yes | \n", "Yes | \n", "24 | \n", "Yes | \n", "Yes | \n", "DSL | \n", "Yes | \n", "... | \n", "Yes | \n", "Yes | \n", "Yes | \n", "Yes | \n", "One year | \n", "Yes | \n", "Mailed check | \n", "84.80 | \n", "1990.50 | \n", "No | \n", "
7039 | \n", "2234-XADUH | \n", "Female | \n", "0 | \n", "Yes | \n", "Yes | \n", "72 | \n", "Yes | \n", "Yes | \n", "Fiber optic | \n", "No | \n", "... | \n", "Yes | \n", "No | \n", "Yes | \n", "Yes | \n", "One year | \n", "Yes | \n", "Credit card (automatic) | \n", "103.20 | \n", "7362.90 | \n", "No | \n", "
7040 | \n", "4801-JZAZL | \n", "Female | \n", "0 | \n", "Yes | \n", "Yes | \n", "11 | \n", "No | \n", "No phone service | \n", "DSL | \n", "Yes | \n", "... | \n", "No | \n", "No | \n", "No | \n", "No | \n", "Month-to-month | \n", "Yes | \n", "Electronic check | \n", "29.60 | \n", "346.45 | \n", "No | \n", "
7041 | \n", "8361-LTMKD | \n", "Male | \n", "1 | \n", "Yes | \n", "No | \n", "4 | \n", "Yes | \n", "Yes | \n", "Fiber optic | \n", "No | \n", "... | \n", "No | \n", "No | \n", "No | \n", "No | \n", "Month-to-month | \n", "Yes | \n", "Mailed check | \n", "74.40 | \n", "306.60 | \n", "Yes | \n", "
7042 | \n", "3186-AJIEK | \n", "Male | \n", "0 | \n", "No | \n", "No | \n", "66 | \n", "Yes | \n", "No | \n", "Fiber optic | \n", "Yes | \n", "... | \n", "Yes | \n", "Yes | \n", "Yes | \n", "Yes | \n", "Two year | \n", "Yes | \n", "Bank transfer (automatic) | \n", "105.65 | \n", "6844.50 | \n", "No | \n", "
7043 rows × 21 columns
\n", "