From 831295e55a04f040bbf86a387a07d6f53be6e61b Mon Sep 17 00:00:00 2001
From: Lucie Lopez <lucielopez@pc-202.home>
Date: Sun, 3 Aug 2025 19:42:20 +0200
Subject: [PATCH] Lab OK

---
 lab-dw-data-structuring-and-combining.ipynb | 584 +++++++++++++++++++-
 1 file changed, 574 insertions(+), 10 deletions(-)

diff --git a/lab-dw-data-structuring-and-combining.ipynb b/lab-dw-data-structuring-and-combining.ipynb
index ec4e3f9..829b4f8 100644
--- a/lab-dw-data-structuring-and-combining.ipynb
+++ b/lab-dw-data-structuring-and-combining.ipynb
@@ -34,16 +34,128 @@
     "- Another option would be to read the clean file you saved in the previous lab, and just clean the two new files and concatenate the three clean datasets"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "bb0e433d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pandas as pd\n",
+    "\n",
+    "# Load the dataset that was cleaned and saved in the previous lab.\n",
+    "df1 = pd.read_csv(filepath_or_buffer=\"cleaned_dataset.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "077e47aa",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load the two raw files that still need cleaning.\n",
+    "url2 = \"https://raw.githubusercontent.com/data-bootcamp-v4/data/main/file2.csv\"\n",
+    "url3 = \"https://raw.githubusercontent.com/data-bootcamp-v4/data/main/file3.csv\"\n",
+    "df2, df3 = pd.read_csv(url2), pd.read_csv(url3)\n",
+    "# Headers may be spelled differently per file (e.g. ST vs State); align them before\n",
+    "# stacking, otherwise concat keeps each spelling as its own half-empty column.\n",
+    "def snake_case_headers(frame):\n",
+    "    return frame.rename(columns=lambda c: c.lower().replace(\" \", \"_\")).rename(columns={\"st\": \"state\"})\n",
+    "\n",
+    "df_new = pd.concat([snake_case_headers(df2), snake_case_headers(df3)], ignore_index=True)"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
-   "id": "492d06e3-92c7-4105-ac72-536db98d3244",
-   "metadata": {
-    "id": "492d06e3-92c7-4105-ac72-536db98d3244"
-   },
+   "id": "dc7b2188",
+   "metadata": {},
    "outputs": [],
    "source": [
-    "# Your code goes here"
+    "# Clean the concatenated file2/file3 frame (df_new) step by step.\n",
+    "\n",
+    "# Headers: lower-case with underscores, and spell the state column out.\n",
+    "df_new.columns = [col.lower().replace(\" \", \"_\") for col in df_new.columns]\n",
+    "df_new = df_new.rename(columns={\"st\":\"state\"})\n",
+    "\n",
+    "# Standardize Gender (spellings missing from the map become NaN and are imputed below)\n",
+    "df_new[\"gender\"] = df_new[\"gender\"].str.strip().str.upper().map({\n",
+    "    'F': 'F', 'FEMALE': 'F', 'FEMAL': 'F',\n",
+    "    'M': 'M', 'MALE': 'M'\n",
+    "})\n",
+    "\n",
+    "# State Abbreviations\n",
+    "state_map = {'AZ': 'Arizona', 'Cali': 'California', 'WA': 'Washington'}\n",
+    "df_new['state'] = df_new['state'].replace(state_map)\n",
+    "\n",
+    "# Education\n",
+    "df_new['education'] = df_new['education'].replace({'Bachelors': 'Bachelor'})\n",
+    "\n",
+    "# Customer Lifetime Value: strip percent signs, then convert to float\n",
+    "df_new['customer_lifetime_value'] = (\n",
+    "    df_new['customer_lifetime_value']\n",
+    "    .astype(str)\n",
+    "    .str.replace('%', '', regex=False)\n",
+    "    .astype(float)\n",
+    ")\n",
+    "\n",
+    "# Vehicle Class: fold the sports/luxury variants into a single label\n",
+    "df_new['vehicle_class'] = df_new['vehicle_class'].replace({\n",
+    "    'Sports Car': 'Luxury',\n",
+    "    'Luxury SUV': 'Luxury',\n",
+    "    'Luxury Car': 'Luxury'\n",
+    "})\n",
+    "\n",
+    "# Number of Open Complaints\n",
+    "# Slash-formatted values such as '1/0/00' keep the count in the middle field; plain\n",
+    "# counts (no slash) are kept as they are instead of being discarded as missing.\n",
+    "complaints = df_new['number_of_open_complaints'].astype(str).str.strip()\n",
+    "middle_field = complaints.str.split('/').str[1]\n",
+    "df_new['number_of_open_complaints'] = (\n",
+    "    pd.to_numeric(middle_field.fillna(complaints), errors='coerce').round().astype('Int64')\n",
+    ")\n",
+    "\n",
+    "# Null Values: median for numeric columns, most frequent value for the others\n",
+    "num_cols = df_new.select_dtypes(include=['float', 'int', 'Int64']).columns\n",
+    "cat_cols = df_new.select_dtypes(include=['object', 'category']).columns\n",
+    "\n",
+    "for col in num_cols:\n",
+    "    df_new[col] = df_new[col].fillna(df_new[col].median())\n",
+    "\n",
+    "for col in cat_cols:\n",
+    "    df_new[col] = df_new[col].fillna(df_new[col].mode()[0])\n",
+    "\n",
+    "# Convert numerics to int\n",
+    "for col in num_cols:\n",
+    "    df_new[col] = df_new[col].astype(int)\n",
+    "\n",
+    "# Drop Duplicates\n",
+    "df_new = df_new.drop_duplicates().reset_index(drop=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "8fca3be4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Stack the previously cleaned data (df1) on top of the newly cleaned rows (df_new).\n",
+    "df_combined = pd.concat(objs=[df1, df_new], axis=0, ignore_index=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "77a456eb",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# De-duplicate the stacked rows (renumbering the index), then persist the result.\n",
+    "df_combined = df_combined.drop_duplicates(ignore_index=True)\n",
+    "\n",
+    "df_combined.to_csv(path_or_buf=\"final_cleaned_data.csv\", index=False)"
    ]
   },
   {
@@ -72,14 +184,404 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "id": "aa10d9b0-1c27-4d3f-a8e4-db6ab73bfd26",
    "metadata": {
     "id": "aa10d9b0-1c27-4d3f-a8e4-db6ab73bfd26"
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>unnamed:_0</th>\n",
+       "      <th>customer</th>\n",
+       "      <th>state</th>\n",
+       "      <th>customer_lifetime_value</th>\n",
+       "      <th>response</th>\n",
+       "      <th>coverage</th>\n",
+       "      <th>education</th>\n",
+       "      <th>effective_to_date</th>\n",
+       "      <th>employmentstatus</th>\n",
+       "      <th>gender</th>\n",
+       "      <th>...</th>\n",
+       "      <th>number_of_policies</th>\n",
+       "      <th>policy_type</th>\n",
+       "      <th>policy</th>\n",
+       "      <th>renew_offer_type</th>\n",
+       "      <th>sales_channel</th>\n",
+       "      <th>total_claim_amount</th>\n",
+       "      <th>vehicle_class</th>\n",
+       "      <th>vehicle_size</th>\n",
+       "      <th>vehicle_type</th>\n",
+       "      <th>month</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>0</td>\n",
+       "      <td>DK49336</td>\n",
+       "      <td>Arizona</td>\n",
+       "      <td>4809.216960</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Basic</td>\n",
+       "      <td>College</td>\n",
+       "      <td>2011-02-18</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>M</td>\n",
+       "      <td>...</td>\n",
+       "      <td>9</td>\n",
+       "      <td>Corporate Auto</td>\n",
+       "      <td>Corporate L3</td>\n",
+       "      <td>Offer3</td>\n",
+       "      <td>Agent</td>\n",
+       "      <td>292.800000</td>\n",
+       "      <td>Four-Door Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>1</td>\n",
+       "      <td>KX64629</td>\n",
+       "      <td>California</td>\n",
+       "      <td>2228.525238</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Basic</td>\n",
+       "      <td>College</td>\n",
+       "      <td>2011-01-18</td>\n",
+       "      <td>Unemployed</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>1</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L3</td>\n",
+       "      <td>Offer4</td>\n",
+       "      <td>Call Center</td>\n",
+       "      <td>744.924331</td>\n",
+       "      <td>Four-Door Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>2</td>\n",
+       "      <td>LZ68649</td>\n",
+       "      <td>Washington</td>\n",
+       "      <td>14947.917300</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Basic</td>\n",
+       "      <td>Bachelor</td>\n",
+       "      <td>2011-02-10</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>M</td>\n",
+       "      <td>...</td>\n",
+       "      <td>2</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L3</td>\n",
+       "      <td>Offer3</td>\n",
+       "      <td>Call Center</td>\n",
+       "      <td>480.000000</td>\n",
+       "      <td>SUV</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>3</td>\n",
+       "      <td>XL78013</td>\n",
+       "      <td>Oregon</td>\n",
+       "      <td>22332.439460</td>\n",
+       "      <td>Yes</td>\n",
+       "      <td>Extended</td>\n",
+       "      <td>College</td>\n",
+       "      <td>2011-01-11</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>M</td>\n",
+       "      <td>...</td>\n",
+       "      <td>2</td>\n",
+       "      <td>Corporate Auto</td>\n",
+       "      <td>Corporate L3</td>\n",
+       "      <td>Offer2</td>\n",
+       "      <td>Branch</td>\n",
+       "      <td>484.013411</td>\n",
+       "      <td>Four-Door Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>4</td>\n",
+       "      <td>QA50777</td>\n",
+       "      <td>Oregon</td>\n",
+       "      <td>9025.067525</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Premium</td>\n",
+       "      <td>Bachelor</td>\n",
+       "      <td>2011-01-17</td>\n",
+       "      <td>Medical Leave</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>7</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L2</td>\n",
+       "      <td>Offer1</td>\n",
+       "      <td>Branch</td>\n",
+       "      <td>707.925645</td>\n",
+       "      <td>Four-Door Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10905</th>\n",
+       "      <td>10905</td>\n",
+       "      <td>FE99816</td>\n",
+       "      <td>Nevada</td>\n",
+       "      <td>15563.369440</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Premium</td>\n",
+       "      <td>Bachelor</td>\n",
+       "      <td>2011-01-19</td>\n",
+       "      <td>Unemployed</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>7</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L1</td>\n",
+       "      <td>Offer3</td>\n",
+       "      <td>Web</td>\n",
+       "      <td>1214.400000</td>\n",
+       "      <td>Luxury Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10906</th>\n",
+       "      <td>10906</td>\n",
+       "      <td>KX53892</td>\n",
+       "      <td>Oregon</td>\n",
+       "      <td>5259.444853</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Basic</td>\n",
+       "      <td>College</td>\n",
+       "      <td>2011-01-06</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>6</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L3</td>\n",
+       "      <td>Offer2</td>\n",
+       "      <td>Branch</td>\n",
+       "      <td>273.018929</td>\n",
+       "      <td>Four-Door Car</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10907</th>\n",
+       "      <td>10907</td>\n",
+       "      <td>TL39050</td>\n",
+       "      <td>Arizona</td>\n",
+       "      <td>23893.304100</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Extended</td>\n",
+       "      <td>Bachelor</td>\n",
+       "      <td>2011-02-06</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>2</td>\n",
+       "      <td>Corporate Auto</td>\n",
+       "      <td>Corporate L3</td>\n",
+       "      <td>Offer1</td>\n",
+       "      <td>Web</td>\n",
+       "      <td>381.306996</td>\n",
+       "      <td>Luxury SUV</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10908</th>\n",
+       "      <td>10908</td>\n",
+       "      <td>WA60547</td>\n",
+       "      <td>California</td>\n",
+       "      <td>11971.977650</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Premium</td>\n",
+       "      <td>College</td>\n",
+       "      <td>2011-02-13</td>\n",
+       "      <td>Employed</td>\n",
+       "      <td>F</td>\n",
+       "      <td>...</td>\n",
+       "      <td>6</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L1</td>\n",
+       "      <td>Offer1</td>\n",
+       "      <td>Branch</td>\n",
+       "      <td>618.288849</td>\n",
+       "      <td>SUV</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>2</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10909</th>\n",
+       "      <td>10909</td>\n",
+       "      <td>IV32877</td>\n",
+       "      <td>California</td>\n",
+       "      <td>6857.519928</td>\n",
+       "      <td>No</td>\n",
+       "      <td>Basic</td>\n",
+       "      <td>Bachelor</td>\n",
+       "      <td>2011-01-08</td>\n",
+       "      <td>Unemployed</td>\n",
+       "      <td>M</td>\n",
+       "      <td>...</td>\n",
+       "      <td>3</td>\n",
+       "      <td>Personal Auto</td>\n",
+       "      <td>Personal L1</td>\n",
+       "      <td>Offer4</td>\n",
+       "      <td>Web</td>\n",
+       "      <td>1021.719397</td>\n",
+       "      <td>SUV</td>\n",
+       "      <td>Medsize</td>\n",
+       "      <td>A</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>10910 rows × 27 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "       unnamed:_0 customer       state  customer_lifetime_value response  \\\n",
+       "0               0  DK49336     Arizona              4809.216960       No   \n",
+       "1               1  KX64629  California              2228.525238       No   \n",
+       "2               2  LZ68649  Washington             14947.917300       No   \n",
+       "3               3  XL78013      Oregon             22332.439460      Yes   \n",
+       "4               4  QA50777      Oregon              9025.067525       No   \n",
+       "...           ...      ...         ...                      ...      ...   \n",
+       "10905       10905  FE99816      Nevada             15563.369440       No   \n",
+       "10906       10906  KX53892      Oregon              5259.444853       No   \n",
+       "10907       10907  TL39050     Arizona             23893.304100       No   \n",
+       "10908       10908  WA60547  California             11971.977650       No   \n",
+       "10909       10909  IV32877  California              6857.519928       No   \n",
+       "\n",
+       "       coverage education effective_to_date employmentstatus gender  ...  \\\n",
+       "0         Basic   College        2011-02-18         Employed      M  ...   \n",
+       "1         Basic   College        2011-01-18       Unemployed      F  ...   \n",
+       "2         Basic  Bachelor        2011-02-10         Employed      M  ...   \n",
+       "3      Extended   College        2011-01-11         Employed      M  ...   \n",
+       "4       Premium  Bachelor        2011-01-17    Medical Leave      F  ...   \n",
+       "...         ...       ...               ...              ...    ...  ...   \n",
+       "10905   Premium  Bachelor        2011-01-19       Unemployed      F  ...   \n",
+       "10906     Basic   College        2011-01-06         Employed      F  ...   \n",
+       "10907  Extended  Bachelor        2011-02-06         Employed      F  ...   \n",
+       "10908   Premium   College        2011-02-13         Employed      F  ...   \n",
+       "10909     Basic  Bachelor        2011-01-08       Unemployed      M  ...   \n",
+       "\n",
+       "       number_of_policies     policy_type        policy  renew_offer_type  \\\n",
+       "0                       9  Corporate Auto  Corporate L3            Offer3   \n",
+       "1                       1   Personal Auto   Personal L3            Offer4   \n",
+       "2                       2   Personal Auto   Personal L3            Offer3   \n",
+       "3                       2  Corporate Auto  Corporate L3            Offer2   \n",
+       "4                       7   Personal Auto   Personal L2            Offer1   \n",
+       "...                   ...             ...           ...               ...   \n",
+       "10905                   7   Personal Auto   Personal L1            Offer3   \n",
+       "10906                   6   Personal Auto   Personal L3            Offer2   \n",
+       "10907                   2  Corporate Auto  Corporate L3            Offer1   \n",
+       "10908                   6   Personal Auto   Personal L1            Offer1   \n",
+       "10909                   3   Personal Auto   Personal L1            Offer4   \n",
+       "\n",
+       "       sales_channel  total_claim_amount  vehicle_class  vehicle_size  \\\n",
+       "0              Agent          292.800000  Four-Door Car       Medsize   \n",
+       "1        Call Center          744.924331  Four-Door Car       Medsize   \n",
+       "2        Call Center          480.000000            SUV       Medsize   \n",
+       "3             Branch          484.013411  Four-Door Car       Medsize   \n",
+       "4             Branch          707.925645  Four-Door Car       Medsize   \n",
+       "...              ...                 ...            ...           ...   \n",
+       "10905            Web         1214.400000     Luxury Car       Medsize   \n",
+       "10906         Branch          273.018929  Four-Door Car       Medsize   \n",
+       "10907            Web          381.306996     Luxury SUV       Medsize   \n",
+       "10908         Branch          618.288849            SUV       Medsize   \n",
+       "10909            Web         1021.719397            SUV       Medsize   \n",
+       "\n",
+       "      vehicle_type month  \n",
+       "0                A     2  \n",
+       "1                A     1  \n",
+       "2                A     2  \n",
+       "3                A     1  \n",
+       "4                A     1  \n",
+       "...            ...   ...  \n",
+       "10905            A     1  \n",
+       "10906            A     1  \n",
+       "10907            A     2  \n",
+       "10908            A     2  \n",
+       "10909            A     1  \n",
+       "\n",
+       "[10910 rows x 27 columns]"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
-    "# Your code goes here"
+    "url = \"https://raw.githubusercontent.com/data-bootcamp-v4/data/main/marketing_customer_analysis_clean.csv\"\n",
+    "df = pd.read_csv(filepath_or_buffer=url)  # fetched over HTTP on every run\n",
+    "df  # bare last expression renders the DataFrame preview"
    ]
   },
   {
@@ -93,6 +595,38 @@
     "Round the total revenue to 2 decimal points.  Analyze the resulting table to draw insights."
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "c9e176db",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "               total_claim_amount\n",
+      "sales_channel                    \n",
+      "Agent                  1810226.82\n",
+      "Branch                 1301204.00\n",
+      "Call Center             926600.82\n",
+      "Web                     706600.04\n"
+     ]
+    }
+   ],
+   "source": [
+    "# 1. Sum of total_claim_amount per sales channel, rounded to 2 decimals, largest first.\n",
+    "revenue_by_channel = (\n",
+    "    pd.pivot_table(\n",
+    "        df, index='sales_channel', values='total_claim_amount', aggfunc='sum'\n",
+    "    )\n",
+    "    .round(2)\n",
+    "    .sort_values(by='total_claim_amount', ascending=False)\n",
+    ")\n",
+    "\n",
+    "print(revenue_by_channel)\n"
+   ]
+  },
   {
    "cell_type": "markdown",
    "id": "640993b2-a291-436c-a34d-a551144f8196",
@@ -103,6 +637,36 @@
     "2. Create a pivot table that shows the average customer lifetime value per gender and education level. Analyze the resulting table to draw insights."
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "9193baa3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "education  Bachelor  College   Doctor  High School or Below   Master\n",
+      "gender                                                              \n",
+      "F           7874.27  7748.82  7328.51               8675.22  8157.05\n",
+      "M           7703.60  8052.46  7415.33               8149.69  8168.83\n"
+     ]
+    }
+   ],
+   "source": [
+    "# 2. Mean customer lifetime value for every gender (rows) x education (columns) pair.\n",
+    "clv_pivot = df.pivot_table(\n",
+    "    index='gender',\n",
+    "    columns='education',\n",
+    "    values='customer_lifetime_value',\n",
+    "    aggfunc='mean',\n",
+    ")\n",
+    "clv_pivot = clv_pivot.round(2)\n",
+    "\n",
+    "print(clv_pivot)"
+   ]
+  },
   {
    "cell_type": "markdown",
    "id": "32c7f2e5-3d90-43e5-be33-9781b6069198",
@@ -146,7 +710,7 @@
    "provenance": []
   },
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "base",
    "language": "python",
    "name": "python3"
   },
@@ -160,7 +724,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.9.13"
+   "version": "3.12.2"
   }
  },
  "nbformat": 4,