{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "ed165d4b-15bc-4619-818b-5758efa8abff",
   "metadata": {},
   "source": [
    "### Reading and Writing Data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "27ed7970-9be1-4b4b-96bd-51b984265251",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (344, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>1</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.1</td><td>18.7</td><td>181</td><td>3750</td><td>&quot;MALE&quot;</td><td>null</td><td>null</td><td>&quot;Not enough blood for isotopes.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>2</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.5</td><td>17.4</td><td>186</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>8.94956</td><td>-24.69454</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>3</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>40.3</td><td>18.0</td><td>195</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>8.36821</td><td>-25.33302</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis 
ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>5</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N3A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>36.7</td><td>19.3</td><td>193</td><td>3450</td><td>&quot;FEMALE&quot;</td><td>8.76651</td><td>-25.32426</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>121</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N39A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>46.8</td><td>14.3</td><td>215</td><td>4850</td><td>&quot;FEMALE&quot;</td><td>8.41151</td><td>-26.13832</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>122</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N39A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>50.4</td><td>15.7</td><td>222</td><td>5750</td><td>&quot;MALE&quot;</td><td>8.30166</td><td>-26.04117</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>123</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>45.2</td><td>14.8</td><td>212</td><td>5200</td><td>&quot;FEMALE&quot;</td><td>8.24246</td><td>-26.11969</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>124</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>49.9</td><td>16.1</td><td>213</td><td>5400</td><td>&quot;MALE&quot;</td><td>8.3639</td><td>-26.15531</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (344, 17)\n",
       "┌───────────┬────────┬─────────────┬────────┬───┬────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species     ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N  ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---         ┆ ---    ┆   ┆ ---    ┆ (o/oo)      ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str         ┆ str    ┆   ┆ str    ┆ ---         ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆             ┆        ┆   ┆        ┆ f64         ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪═════════════╪════════╪═══╪════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 1      ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ null        ┆ null        ┆ Not enough  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ blood for   │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ isotopes.   │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 2      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.94956     ┆ -24.69454   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 3      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.36821     ┆ -25.33302   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Adelie      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 5      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.76651     ┆ -25.32426   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ …         ┆ …      ┆ …           ┆ …      ┆ … ┆ …      ┆ …           ┆ …           ┆ …           │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 121    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.41151     ┆ -26.13832   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 122    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.30166     ┆ -26.04117   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 123    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.24246     ┆ -26.11969   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 124    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.3639      ┆ -26.15531   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "└───────────┴────────┴─────────────┴────────┴───┴────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import polars as pl\n",
    "\n",
    "# Read the raw penguin CSV into a polars DataFrame.\n",
    "df = pl.read_csv('penguins_lter.csv')\n",
    "# A bare expression on the last line is what renders the table kept in this\n",
    "# cell's saved output; the assignment on its own displays nothing.\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "42e60bf7-0a17-4be4-9c35-241b30325fa9",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  \n",
       "0    Not enough blood for isotopes.  \n",
       "1                               NaN  \n",
       "2                               NaN  \n",
       "3                Adult not sampled.  \n",
       "4                               NaN  \n",
       "..                              ...  \n",
       "339                             NaN  \n",
       "340                             NaN  \n",
       "341                             NaN  \n",
       "342                             NaN  \n",
       "343                             NaN  \n",
       "\n",
       "[344 rows x 17 columns]"
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Read the same CSV with pandas so the two libraries can be compared.\n",
    "dfa = pd.read_csv('penguins_lter.csv')\n",
    "# A bare expression on the last line is what renders the table kept in this\n",
    "# cell's saved output; the assignment on its own displays nothing.\n",
    "dfa"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "49813f31-3748-4dd3-95bf-071477acea51",
   "metadata": {},
   "outputs": [],
   "source": [
    "# polars export: pipe-delimited, no header row, nulls spelled out as NULL.\n",
    "df.write_csv(\n",
    "    'penguins_lter_new.csv',\n",
    "    separator='|',\n",
    "    null_value=\"NULL\",\n",
    "    include_header=False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "cba2e6c0-3196-4158-87c8-434730f12d3e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "PAL0708|1|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A1|Yes|11/11/07|39.1|18.7|181|3750|MALE|NULL|NULL|Not enough blood for isotopes.\n",
      "PAL0708|2|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A2|Yes|11/11/07|39.5|17.4|186|3800|FEMALE|8.94956|-24.69454|NULL\n",
      "PAL0708|3|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A1|Yes|11/16/07|40.3|18.0|195|3250|FEMALE|8.36821|-25.33302|NULL\n",
      "PAL0708|4|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A2|Yes|11/16/07|NULL|NULL|NULL|NULL|NULL|NULL|NULL|Adult not sampled.\n"
     ]
    }
   ],
   "source": [
    "# Show the first four lines of the exported file.\n",
    "!head -n 4 penguins_lter_new.csv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "80751874-1274-4821-b777-c223cc5c629c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# pandas export: header=False drops the column names, but the row index is\n",
    "# still written as the first field because `index` is left at its default.\n",
    "dfa.to_csv(\n",
    "    'penguins_lter_new.csv',\n",
    "    sep='|',\n",
    "    na_rep=\"NULL\",\n",
    "    header=False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "c54ff244-a2c7-43f3-ac0e-8463b86fa751",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0|PAL0708|1|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A1|Yes|11/11/07|39.1|18.7|181.0|3750.0|MALE|NULL|NULL|Not enough blood for isotopes.\n",
      "1|PAL0708|2|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A2|Yes|11/11/07|39.5|17.4|186.0|3800.0|FEMALE|8.94956|-24.69454|NULL\n",
      "2|PAL0708|3|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A1|Yes|11/16/07|40.3|18.0|195.0|3250.0|FEMALE|8.36821|-25.33302|NULL\n",
      "3|PAL0708|4|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A2|Yes|11/16/07|NULL|NULL|NULL|NULL|NULL|NULL|NULL|Adult not sampled.\n"
     ]
    }
   ],
   "source": [
    "# Show the first four lines of the exported file.\n",
    "!head -n 4 penguins_lter_new.csv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "d1651931-ae85-416b-b3bc-f4d2f5de157a",
   "metadata": {},
   "outputs": [],
   "source": [
    "# pandas export again, this time with index=False so the row index is left\n",
    "# out of the file.\n",
    "dfa.to_csv(\n",
    "    'penguins_lter_new.csv',\n",
    "    sep='|',\n",
    "    na_rep=\"NULL\",\n",
    "    header=False,\n",
    "    index=False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "271af887-14c2-43e7-ae7b-af20f1d98eaf",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "PAL0708|1|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A1|Yes|11/11/07|39.1|18.7|181.0|3750.0|MALE|NULL|NULL|Not enough blood for isotopes.\n",
      "PAL0708|2|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N1A2|Yes|11/11/07|39.5|17.4|186.0|3800.0|FEMALE|8.94956|-24.69454|NULL\n",
      "PAL0708|3|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A1|Yes|11/16/07|40.3|18.0|195.0|3250.0|FEMALE|8.36821|-25.33302|NULL\n",
      "PAL0708|4|Adelie Penguin (Pygoscelis adeliae)|Anvers|Torgersen|Adult, 1 Egg Stage|N2A2|Yes|11/16/07|NULL|NULL|NULL|NULL|NULL|NULL|NULL|Adult not sampled.\n"
     ]
    }
   ],
   "source": [
    "# Show the first four lines of the exported file.\n",
    "!head -n 4 penguins_lter_new.csv"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b694ad61-6c49-42a1-84c2-e276ede88941",
   "metadata": {},
   "source": [
    "### Missing Data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "9fe39aa7-5e41-4b5c-9dc2-90386d502b00",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (344,)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Culmen Length (mm)</th></tr><tr><td>bool</td></tr></thead><tbody><tr><td>false</td></tr><tr><td>false</td></tr><tr><td>false</td></tr><tr><td>true</td></tr><tr><td>false</td></tr><tr><td>&hellip;</td></tr><tr><td>true</td></tr><tr><td>false</td></tr><tr><td>false</td></tr><tr><td>false</td></tr><tr><td>false</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (344,)\n",
       "Series: 'Culmen Length (mm)' [bool]\n",
       "[\n",
       "\tfalse\n",
       "\tfalse\n",
       "\tfalse\n",
       "\ttrue\n",
       "\tfalse\n",
       "\t…\n",
       "\ttrue\n",
       "\tfalse\n",
       "\tfalse\n",
       "\tfalse\n",
       "\tfalse\n",
       "]"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Boolean Series: true wherever the culmen length is null.\n",
    "df.get_column('Culmen Length (mm)').is_null()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "030063e1-e069-47f1-8191-13fe386de23b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (2, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (2, 17)\n",
       "┌───────────┬────────┬──────────────┬────────┬───┬──────┬──────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species      ┆ Region ┆ … ┆ Sex  ┆ Delta 15 N   ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---          ┆ ---    ┆   ┆ ---  ┆ (o/oo)       ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str          ┆ str    ┆   ┆ str  ┆ ---          ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆              ┆        ┆   ┆      ┆ f64          ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪══════════════╪════════╪═══╪══════╪══════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 4      ┆ Adelie       ┆ Anvers ┆ … ┆ null ┆ null         ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆      ┆              ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆      ┆              ┆             ┆             │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆      ┆              ┆             ┆             │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo       ┆ Anvers ┆ … ┆ null ┆ null         ┆ null        ┆ null        │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆      ┆              ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆      ┆              ┆             ┆             │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆      ┆              ┆             ┆             │\n",
       "└───────────┴────────┴──────────────┴────────┴───┴──────┴──────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show only the rows whose culmen length is null\n",
    "df.filter(\n",
    "    pl.col('Culmen Length (mm)').is_null()\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "8f7565d9-11bf-415b-9800-793e2f38dd9d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (344, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>1</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.1</td><td>18.7</td><td>181</td><td>3750</td><td>&quot;MALE&quot;</td><td>null</td><td>null</td><td>&quot;Not enough blood for isotopes.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>2</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.5</td><td>17.4</td><td>186</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>8.94956</td><td>-24.69454</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>3</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>40.3</td><td>18.0</td><td>195</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>8.36821</td><td>-25.33302</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis 
ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>43.92193</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>5</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N3A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>36.7</td><td>19.3</td><td>193</td><td>3450</td><td>&quot;FEMALE&quot;</td><td>8.76651</td><td>-25.32426</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>43.92193</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>121</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N39A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>46.8</td><td>14.3</td><td>215</td><td>4850</td><td>&quot;FEMALE&quot;</td><td>8.41151</td><td>-26.13832</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>122</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N39A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>50.4</td><td>15.7</td><td>222</td><td>5750</td><td>&quot;MALE&quot;</td><td>8.30166</td><td>-26.04117</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>123</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>45.2</td><td>14.8</td><td>212</td><td>5200</td><td>&quot;FEMALE&quot;</td><td>8.24246</td><td>-26.11969</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>124</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>49.9</td><td>16.1</td><td>213</td><td>5400</td><td>&quot;MALE&quot;</td><td>8.3639</td><td>-26.15531</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (344, 17)\n",
       "┌───────────┬────────┬─────────────┬────────┬───┬────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species     ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N  ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---         ┆ ---    ┆   ┆ ---    ┆ (o/oo)      ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str         ┆ str    ┆   ┆ str    ┆ ---         ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆             ┆        ┆   ┆        ┆ f64         ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪═════════════╪════════╪═══╪════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 1      ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ null        ┆ null        ┆ Not enough  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ blood for   │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ isotopes.   │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 2      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.94956     ┆ -24.69454   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 3      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.36821     ┆ -25.33302   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Adelie      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 5      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.76651     ┆ -25.32426   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ …         ┆ …      ┆ …           ┆ …      ┆ … ┆ …      ┆ …           ┆ …           ┆ …           │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 121    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.41151     ┆ -26.13832   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 122    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.30166     ┆ -26.04117   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 123    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.24246     ┆ -26.11969   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 124    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.3639      ┆ -26.15531   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "└───────────┴────────┴─────────────┴────────┴───┴────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Impute missing culmen lengths with the mean of the whole column;\n",
    "# the filled frame is bound to `df_nn`.\n",
    "df_nn = df.with_columns(pl.col('Culmen Length (mm)').fill_null(strategy='mean'))\n",
    "# End on the frame so the cell renders it, matching the saved output\n",
    "df_nn"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "25d78a94-28f7-486a-b57f-f68855889140",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>43.92193</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N62A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/26/07&quot;</td><td>45.4</td><td>18.7</td><td>188</td><td>3525</td><td>&quot;FEMALE&quot;</td><td>8.64701</td><td>-24.62717</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N32A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/27/07&quot;</td><td>50.0</td><td>15.2</td><td>218</td><td>5700</td><td>&quot;MALE&quot;</td><td>8.2554</td><td>-25.40075</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 17)\n",
       "┌───────────┬────────┬─────────────┬────────┬───┬────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species     ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N  ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---         ┆ ---    ┆   ┆ ---    ┆ (o/oo)      ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str         ┆ str    ┆   ┆ str    ┆ ---         ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆             ┆        ┆   ┆        ┆ f64         ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪═════════════╪════════╪═══╪════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 4      ┆ Adelie      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Chinstrap   ┆ Anvers ┆ … ┆ FEMALE ┆ 8.64701     ┆ -24.62717   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ …           ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.2554      ┆ -25.40075   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "└───────────┴────────┴─────────────┴────────┴───┴────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Inspect the rows with Sample Number 4 in the mean-filled frame\n",
    "df_nn.filter(pl.col('Sample Number').eq(4))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "2afd446a-755a-4341-b0fb-efc95998f023",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0      False\n",
       "1      False\n",
       "2      False\n",
       "3       True\n",
       "4      False\n",
       "       ...  \n",
       "339     True\n",
       "340    False\n",
       "341    False\n",
       "342    False\n",
       "343    False\n",
       "Name: Culmen Length (mm), Length: 344, dtype: bool"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# pandas counterpart: boolean mask of missing culmen lengths\n",
    "dfa['Culmen Length (mm)'].isna()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "71169db6-d214-4928-a733-31fdd5ea8776",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "3                   NaN                NaN                  NaN   \n",
       "339                 NaN                NaN                  NaN   \n",
       "\n",
       "     Body Mass (g)  Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "3              NaN  NaN                NaN                NaN   \n",
       "339            NaN  NaN                NaN                NaN   \n",
       "\n",
       "               Comments  \n",
       "3    Adult not sampled.  \n",
       "339                 NaN  "
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Select the rows whose culmen length is missing\n",
    "dfa.loc[dfa['Culmen Length (mm)'].isna()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "id": "d74d4e3f-8d0c-4a62-8439-b76ac1542a0c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>47.2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                  40.3                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                47.2                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  \n",
       "0    Not enough blood for isotopes.  \n",
       "1                               NaN  \n",
       "2                               NaN  \n",
       "3                Adult not sampled.  \n",
       "4                               NaN  \n",
       "..                              ...  \n",
       "339                             NaN  \n",
       "340                             NaN  \n",
       "341                             NaN  \n",
       "342                             NaN  \n",
       "343                             NaN  \n",
       "\n",
       "[344 rows x 17 columns]"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Forward-fill missing culmen lengths: each NaN takes the last valid value above it.\n",
    "# `assign` returns a new frame, so `dfa` itself is left unchanged.\n",
    "dfa_nn = dfa.assign(**{'Culmen Length (mm)': dfa['Culmen Length (mm)'].ffill()})\n",
    "# End on the frame so a fresh run displays the result (a bare assignment shows nothing).\n",
    "dfa_nn"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "id": "43ff1b44-9ce0-4ad9-a179-548306189802",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>155</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N62A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/26/07</td>\n",
       "      <td>45.4</td>\n",
       "      <td>18.7</td>\n",
       "      <td>188.0</td>\n",
       "      <td>3525.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.64701</td>\n",
       "      <td>-24.62717</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>223</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N32A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/27/07</td>\n",
       "      <td>50.0</td>\n",
       "      <td>15.2</td>\n",
       "      <td>218.0</td>\n",
       "      <td>5700.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.25540</td>\n",
       "      <td>-25.40075</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                                    Species  \\\n",
       "3     PAL0708              4        Adelie Penguin (Pygoscelis adeliae)   \n",
       "155   PAL0708              4  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "223   PAL0708              4          Gentoo penguin (Pygoscelis papua)   \n",
       "\n",
       "     Region     Island               Stage Individual ID Clutch Completion  \\\n",
       "3    Anvers  Torgersen  Adult, 1 Egg Stage          N2A2               Yes   \n",
       "155  Anvers      Dream  Adult, 1 Egg Stage         N62A2               Yes   \n",
       "223  Anvers     Biscoe  Adult, 1 Egg Stage         N32A2               Yes   \n",
       "\n",
       "     Date Egg  Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "3    11/16/07                40.3                NaN                  NaN   \n",
       "155  11/26/07                45.4               18.7                188.0   \n",
       "223  11/27/07                50.0               15.2                218.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "3              NaN     NaN                NaN                NaN   \n",
       "155         3525.0  FEMALE            8.64701          -24.62717   \n",
       "223         5700.0    MALE            8.25540          -25.40075   \n",
       "\n",
       "               Comments  \n",
       "3    Adult not sampled.  \n",
       "155                 NaN  \n",
       "223                 NaN  "
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Rows whose 'Sample Number' equals 4, taken from the forward-filled frame.\n",
    "dfa_nn.loc[dfa_nn['Sample Number'].eq(4)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "id": "2afa90cf-f25c-4366-92b7-4f32fcf971c9",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (344, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>1</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>2.090909</td><td>18.7</td><td>181</td><td>3750</td><td>&quot;MALE&quot;</td><td>null</td><td>null</td><td>&quot;Not enough blood for isotopes.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>2</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>2.270115</td><td>17.4</td><td>186</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>8.94956</td><td>-24.69454</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>3</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>2.238889</td><td>18.0</td><td>195</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>8.36821</td><td>-25.33302</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis 
ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>5</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N3A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>1.901554</td><td>19.3</td><td>193</td><td>3450</td><td>&quot;FEMALE&quot;</td><td>8.76651</td><td>-25.32426</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>121</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N39A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>3.272727</td><td>14.3</td><td>215</td><td>4850</td><td>&quot;FEMALE&quot;</td><td>8.41151</td><td>-26.13832</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>122</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N39A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>3.210191</td><td>15.7</td><td>222</td><td>5750</td><td>&quot;MALE&quot;</td><td>8.30166</td><td>-26.04117</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>123</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>3.054054</td><td>14.8</td><td>212</td><td>5200</td><td>&quot;FEMALE&quot;</td><td>8.24246</td><td>-26.11969</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>124</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>3.099379</td><td>16.1</td><td>213</td><td>5400</td><td>&quot;MALE&quot;</td><td>8.3639</td><td>-26.15531</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (344, 17)\n",
       "┌───────────┬────────┬─────────────┬────────┬───┬────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species     ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N  ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---         ┆ ---    ┆   ┆ ---    ┆ (o/oo)      ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str         ┆ str    ┆   ┆ str    ┆ ---         ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆             ┆        ┆   ┆        ┆ f64         ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪═════════════╪════════╪═══╪════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 1      ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ null        ┆ null        ┆ Not enough  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ blood for   │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ isotopes.   │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 2      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.94956     ┆ -24.69454   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 3      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.36821     ┆ -25.33302   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Adelie      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 5      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.76651     ┆ -25.32426   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ …         ┆ …      ┆ …           ┆ …      ┆ … ┆ …      ┆ …           ┆ …           ┆ …           │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 121    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.41151     ┆ -26.13832   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 122    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.30166     ┆ -26.04117   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 123    ┆ Gentoo      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.24246     ┆ -26.11969   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 124    ┆ Gentoo      ┆ Anvers ┆ … ┆ MALE   ┆ 8.3639      ┆ -26.15531   ┆ null        │\n",
       "│           ┆        ┆ penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ pap…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "└───────────┴────────┴─────────────┴────────┴───┴────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Culmen length-to-depth ratio.\n",
    "#\n",
    "# Caution: the result is not aliased, so it keeps the name of the left operand\n",
    "# and overwrites the existing 'Culmen Length (mm)' column instead of adding a new one.\n",
    "df.with_columns(df.get_column('Culmen Length (mm)') / df.get_column('Culmen Depth (mm)'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "id": "b6e20726-a4b6-441b-95a2-41d4f29845a1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (344, 18)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th><th>CulmenRatio</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td><td>f64</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>1</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.1</td><td>18.7</td><td>181</td><td>3750</td><td>&quot;MALE&quot;</td><td>null</td><td>null</td><td>&quot;Not enough blood for isotopes.&quot;</td><td>2.090909</td></tr><tr><td>&quot;PAL0708&quot;</td><td>2</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.5</td><td>17.4</td><td>186</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>8.94956</td><td>-24.69454</td><td>null</td><td>2.270115</td></tr><tr><td>&quot;PAL0708&quot;</td><td>3</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N2A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>40.3</td><td>18.0</td><td>195</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>8.36821</td><td>-25.33302</td><td>null</td><td>2.238889</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>5</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N3A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>36.7</td><td>19.3</td><td>193</td><td>3450</td><td>&quot;FEMALE&quot;</td><td>8.76651</td><td>-25.32426</td><td>null</td><td>1.901554</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>121</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N39A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>46.8</td><td>14.3</td><td>215</td><td>4850</td><td>&quot;FEMALE&quot;</td><td>8.41151</td><td>-26.13832</td><td>null</td><td>3.272727</td></tr><tr><td>&quot;PAL0910&quot;</td><td>122</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N39A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>50.4</td><td>15.7</td><td>222</td><td>5750</td><td>&quot;MALE&quot;</td><td>8.30166</td><td>-26.04117</td><td>null</td><td>3.210191</td></tr><tr><td>&quot;PAL0910&quot;</td><td>123</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>45.2</td><td>14.8</td><td>212</td><td>5200</td><td>&quot;FEMALE&quot;</td><td>8.24246</td><td>-26.11969</td><td>null</td><td>3.054054</td></tr><tr><td>&quot;PAL0910&quot;</td><td>124</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>49.9</td><td>16.1</td><td>213</td><td>5400</td><td>&quot;MALE&quot;</td><td>8.3639</td><td>-26.15531</td><td>null</td><td>3.099379</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (344, 18)\n",
       "┌───────────┬────────┬────────────┬────────┬───┬────────────┬────────────┬────────────┬────────────┐\n",
       "│ studyName ┆ Sample ┆ Species    ┆ Region ┆ … ┆ Delta 15 N ┆ Delta 13 C ┆ Comments   ┆ CulmenRati │\n",
       "│ ---       ┆ Number ┆ ---        ┆ ---    ┆   ┆ (o/oo)     ┆ (o/oo)     ┆ ---        ┆ o          │\n",
       "│ str       ┆ ---    ┆ str        ┆ str    ┆   ┆ ---        ┆ ---        ┆ str        ┆ ---        │\n",
       "│           ┆ i64    ┆            ┆        ┆   ┆ f64        ┆ f64        ┆            ┆ f64        │\n",
       "╞═══════════╪════════╪════════════╪════════╪═══╪════════════╪════════════╪════════════╪════════════╡\n",
       "│ PAL0708   ┆ 1      ┆ Adelie     ┆ Anvers ┆ … ┆ null       ┆ null       ┆ Not enough ┆ 2.090909   │\n",
       "│           ┆        ┆ Penguin    ┆        ┆   ┆            ┆            ┆ blood for  ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆ isotopes.  ┆            │\n",
       "│           ┆        ┆ s ade…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0708   ┆ 2      ┆ Adelie     ┆ Anvers ┆ … ┆ 8.94956    ┆ -24.69454  ┆ null       ┆ 2.270115   │\n",
       "│           ┆        ┆ Penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s ade…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0708   ┆ 3      ┆ Adelie     ┆ Anvers ┆ … ┆ 8.36821    ┆ -25.33302  ┆ null       ┆ 2.238889   │\n",
       "│           ┆        ┆ Penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s ade…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0708   ┆ 4      ┆ Adelie     ┆ Anvers ┆ … ┆ null       ┆ null       ┆ Adult not  ┆ null       │\n",
       "│           ┆        ┆ Penguin    ┆        ┆   ┆            ┆            ┆ sampled.   ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s ade…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0708   ┆ 5      ┆ Adelie     ┆ Anvers ┆ … ┆ 8.76651    ┆ -25.32426  ┆ null       ┆ 1.901554   │\n",
       "│           ┆        ┆ Penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s ade…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ …         ┆ …      ┆ …          ┆ …      ┆ … ┆ …          ┆ …          ┆ …          ┆ …          │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo     ┆ Anvers ┆ … ┆ null       ┆ null       ┆ null       ┆ null       │\n",
       "│           ┆        ┆ penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s pap…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0910   ┆ 121    ┆ Gentoo     ┆ Anvers ┆ … ┆ 8.41151    ┆ -26.13832  ┆ null       ┆ 3.272727   │\n",
       "│           ┆        ┆ penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s pap…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0910   ┆ 122    ┆ Gentoo     ┆ Anvers ┆ … ┆ 8.30166    ┆ -26.04117  ┆ null       ┆ 3.210191   │\n",
       "│           ┆        ┆ penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s pap…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0910   ┆ 123    ┆ Gentoo     ┆ Anvers ┆ … ┆ 8.24246    ┆ -26.11969  ┆ null       ┆ 3.054054   │\n",
       "│           ┆        ┆ penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s pap…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│ PAL0910   ┆ 124    ┆ Gentoo     ┆ Anvers ┆ … ┆ 8.3639     ┆ -26.15531  ┆ null       ┆ 3.099379   │\n",
       "│           ┆        ┆ penguin    ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ (Pygosceli ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "│           ┆        ┆ s pap…     ┆        ┆   ┆            ┆            ┆            ┆            │\n",
       "└───────────┴────────┴────────────┴────────┴───┴────────────┴────────────┴────────────┴────────────┘"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show df with a derived CulmenRatio column; the result is displayed, not stored.\n",
    "df.with_columns(\n",
    "    CulmenRatio=df['Culmen Length (mm)'] / df['Culmen Depth (mm)'],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "id": "c69a46ab-83f3-4aca-8d72-f8fea53071f0",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "      <th>CulmenRatio</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "      <td>2.090909</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2.270115</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2.238889</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.901554</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.272727</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.210191</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.054054</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.099379</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 18 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  CulmenRatio  \n",
       "0    Not enough blood for isotopes.     2.090909  \n",
       "1                               NaN     2.270115  \n",
       "2                               NaN     2.238889  \n",
       "3                Adult not sampled.          NaN  \n",
       "4                               NaN     1.901554  \n",
       "..                              ...          ...  \n",
       "339                             NaN          NaN  \n",
       "340                             NaN     3.272727  \n",
       "341                             NaN     3.210191  \n",
       "342                             NaN     3.054054  \n",
       "343                             NaN     3.099379  \n",
       "\n",
       "[344 rows x 18 columns]"
      ]
     },
     "execution_count": 48,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# mutates! Item assignment stores the new column on dfa itself.\n",
    "dfa['CulmenRatio'] = dfa['Culmen Length (mm)'].div(dfa['Culmen Depth (mm)'])\n",
    "dfa"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "id": "5997d5ce-40d6-4c3b-9ad7-838f44cb3423",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "      <th>CulmenRatio</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "      <td>2.090909</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2.270115</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2.238889</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.901554</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.272727</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.210191</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.054054</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3.099379</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 18 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  CulmenRatio  \n",
       "0    Not enough blood for isotopes.     2.090909  \n",
       "1                               NaN     2.270115  \n",
       "2                               NaN     2.238889  \n",
       "3                Adult not sampled.          NaN  \n",
       "4                               NaN     1.901554  \n",
       "..                              ...          ...  \n",
       "339                             NaN          NaN  \n",
       "340                             NaN     3.272727  \n",
       "341                             NaN     3.210191  \n",
       "342                             NaN     3.054054  \n",
       "343                             NaN     3.099379  \n",
       "\n",
       "[344 rows x 18 columns]"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Re-read the CSV into dfa before deriving the column.\n",
    "dfa = pd.read_csv('penguins_lter.csv')\n",
    "\n",
    "# The assign() result is displayed only; it is not bound back to dfa.\n",
    "dfa.assign(\n",
    "    CulmenRatio=lambda frame: frame['Culmen Length (mm)'] / frame['Culmen Depth (mm)'],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "id": "bb82ef2d-fbd9-4480-851c-b4a8f7adabe6",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  \n",
       "0    Not enough blood for isotopes.  \n",
       "1                               NaN  \n",
       "2                               NaN  \n",
       "3                Adult not sampled.  \n",
       "4                               NaN  \n",
       "..                              ...  \n",
       "339                             NaN  \n",
       "340                             NaN  \n",
       "341                             NaN  \n",
       "342                             NaN  \n",
       "343                             NaN  \n",
       "\n",
       "[344 rows x 17 columns]"
      ]
     },
     "execution_count": 50,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Bare last expression -> rich display; pandas abbreviates a long frame to its first and last rows.\n",
    "dfa"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "989fbe48-adb8-4fbd-b087-7479a075991a",
   "metadata": {},
   "source": [
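    "#### Don't Use `inplace`!\n",
    "\n",
    "Passing `inplace=True` mutates the DataFrame and returns `None`, which breaks method chaining; prefer assigning the returned DataFrame to a new name."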
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "id": "da59b51f-610e-4b7f-9e1e-8dc5b323209d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>10</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>42.0</td>\n",
       "      <td>20.2</td>\n",
       "      <td>190.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.13362</td>\n",
       "      <td>-25.09368</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>13</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>41.1</td>\n",
       "      <td>17.6</td>\n",
       "      <td>182.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>18</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>42.5</td>\n",
       "      <td>20.7</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.67538</td>\n",
       "      <td>-25.13993</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>20</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>46.0</td>\n",
       "      <td>21.5</td>\n",
       "      <td>194.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11616</td>\n",
       "      <td>-24.77227</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>338</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>119</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A1</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>47.2</td>\n",
       "      <td>13.7</td>\n",
       "      <td>214.0</td>\n",
       "      <td>4925.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.99184</td>\n",
       "      <td>-26.20538</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>242 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "9     PAL0708             10  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "12    PAL0708             13  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "17    PAL0708             18  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "19    PAL0708             20  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "338   PAL0910            119    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "9    Torgersen  Adult, 1 Egg Stage          N5A2               Yes   11/9/07   \n",
       "12   Torgersen  Adult, 1 Egg Stage          N7A1               Yes  11/15/07   \n",
       "17   Torgersen  Adult, 1 Egg Stage          N9A2               Yes  11/12/07   \n",
       "19   Torgersen  Adult, 1 Egg Stage         N10A2               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "338     Biscoe  Adult, 1 Egg Stage         N38A1                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "2                  40.3               18.0                195.0   \n",
       "9                  42.0               20.2                190.0   \n",
       "12                 41.1               17.6                182.0   \n",
       "17                 42.5               20.7                197.0   \n",
       "19                 46.0               21.5                194.0   \n",
       "..                  ...                ...                  ...   \n",
       "338                47.2               13.7                214.0   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "9           4250.0     NaN            9.13362          -25.09368   \n",
       "12          3200.0  FEMALE                NaN                NaN   \n",
       "17          4500.0    MALE            8.67538          -25.13993   \n",
       "19          4200.0    MALE            9.11616          -24.77227   \n",
       "..             ...     ...                ...                ...   \n",
       "338         4925.0  FEMALE            7.99184          -26.20538   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                                 Comments  \n",
       "2                                     NaN  \n",
       "9    No blood sample obtained for sexing.  \n",
       "12         Not enough blood for isotopes.  \n",
       "17                                    NaN  \n",
       "19                                    NaN  \n",
       "..                                    ...  \n",
       "338                                   NaN  \n",
       "340                                   NaN  \n",
       "341                                   NaN  \n",
       "342                                   NaN  \n",
       "343                                   NaN  \n",
       "\n",
       "[242 rows x 17 columns]"
      ]
     },
     "execution_count": 51,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Boolean-mask row selection: returns a new frame and leaves dfa untouched.\n",
    "# Rows whose culmen length is NaN compare False against 40, so they are excluded.\n",
    "dfa.loc[dfa['Culmen Length (mm)'] > 40]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "id": "406f0990-f5d0-4755-ac7f-cb20f0221e8b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2</td>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>9</td>\n",
       "      <td>PAL0708</td>\n",
       "      <td>10</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>42.0</td>\n",
       "      <td>20.2</td>\n",
       "      <td>190.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.13362</td>\n",
       "      <td>-25.09368</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>12</td>\n",
       "      <td>PAL0708</td>\n",
       "      <td>13</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>41.1</td>\n",
       "      <td>17.6</td>\n",
       "      <td>182.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>17</td>\n",
       "      <td>PAL0708</td>\n",
       "      <td>18</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>42.5</td>\n",
       "      <td>20.7</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.67538</td>\n",
       "      <td>-25.13993</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>19</td>\n",
       "      <td>PAL0708</td>\n",
       "      <td>20</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>46.0</td>\n",
       "      <td>21.5</td>\n",
       "      <td>194.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11616</td>\n",
       "      <td>-24.77227</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>237</th>\n",
       "      <td>338</td>\n",
       "      <td>PAL0910</td>\n",
       "      <td>119</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A1</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>47.2</td>\n",
       "      <td>13.7</td>\n",
       "      <td>214.0</td>\n",
       "      <td>4925.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.99184</td>\n",
       "      <td>-26.20538</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>238</th>\n",
       "      <td>340</td>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>239</th>\n",
       "      <td>341</td>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>240</th>\n",
       "      <td>342</td>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>241</th>\n",
       "      <td>343</td>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>242 rows × 18 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index studyName  Sample Number                              Species  \\\n",
       "0        2   PAL0708              3  Adelie Penguin (Pygoscelis adeliae)   \n",
       "1        9   PAL0708             10  Adelie Penguin (Pygoscelis adeliae)   \n",
       "2       12   PAL0708             13  Adelie Penguin (Pygoscelis adeliae)   \n",
       "3       17   PAL0708             18  Adelie Penguin (Pygoscelis adeliae)   \n",
       "4       19   PAL0708             20  Adelie Penguin (Pygoscelis adeliae)   \n",
       "..     ...       ...            ...                                  ...   \n",
       "237    338   PAL0910            119    Gentoo penguin (Pygoscelis papua)   \n",
       "238    340   PAL0910            121    Gentoo penguin (Pygoscelis papua)   \n",
       "239    341   PAL0910            122    Gentoo penguin (Pygoscelis papua)   \n",
       "240    342   PAL0910            123    Gentoo penguin (Pygoscelis papua)   \n",
       "241    343   PAL0910            124    Gentoo penguin (Pygoscelis papua)   \n",
       "\n",
       "     Region     Island               Stage Individual ID Clutch Completion  \\\n",
       "0    Anvers  Torgersen  Adult, 1 Egg Stage          N2A1               Yes   \n",
       "1    Anvers  Torgersen  Adult, 1 Egg Stage          N5A2               Yes   \n",
       "2    Anvers  Torgersen  Adult, 1 Egg Stage          N7A1               Yes   \n",
       "3    Anvers  Torgersen  Adult, 1 Egg Stage          N9A2               Yes   \n",
       "4    Anvers  Torgersen  Adult, 1 Egg Stage         N10A2               Yes   \n",
       "..      ...        ...                 ...           ...               ...   \n",
       "237  Anvers     Biscoe  Adult, 1 Egg Stage         N38A1                No   \n",
       "238  Anvers     Biscoe  Adult, 1 Egg Stage         N39A1               Yes   \n",
       "239  Anvers     Biscoe  Adult, 1 Egg Stage         N39A2               Yes   \n",
       "240  Anvers     Biscoe  Adult, 1 Egg Stage         N43A1               Yes   \n",
       "241  Anvers     Biscoe  Adult, 1 Egg Stage         N43A2               Yes   \n",
       "\n",
       "     Date Egg  Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0    11/16/07                40.3               18.0                195.0   \n",
       "1     11/9/07                42.0               20.2                190.0   \n",
       "2    11/15/07                41.1               17.6                182.0   \n",
       "3    11/12/07                42.5               20.7                197.0   \n",
       "4    11/16/07                46.0               21.5                194.0   \n",
       "..        ...                 ...                ...                  ...   \n",
       "237   12/1/09                47.2               13.7                214.0   \n",
       "238  11/22/09                46.8               14.3                215.0   \n",
       "239  11/22/09                50.4               15.7                222.0   \n",
       "240  11/22/09                45.2               14.8                212.0   \n",
       "241  11/22/09                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3250.0  FEMALE            8.36821          -25.33302   \n",
       "1           4250.0     NaN            9.13362          -25.09368   \n",
       "2           3200.0  FEMALE                NaN                NaN   \n",
       "3           4500.0    MALE            8.67538          -25.13993   \n",
       "4           4200.0    MALE            9.11616          -24.77227   \n",
       "..             ...     ...                ...                ...   \n",
       "237         4925.0  FEMALE            7.99184          -26.20538   \n",
       "238         4850.0  FEMALE            8.41151          -26.13832   \n",
       "239         5750.0    MALE            8.30166          -26.04117   \n",
       "240         5200.0  FEMALE            8.24246          -26.11969   \n",
       "241         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                                 Comments  \n",
       "0                                     NaN  \n",
       "1    No blood sample obtained for sexing.  \n",
       "2          Not enough blood for isotopes.  \n",
       "3                                     NaN  \n",
       "4                                     NaN  \n",
       "..                                    ...  \n",
       "237                                   NaN  \n",
       "238                                   NaN  \n",
       "239                                   NaN  \n",
       "240                                   NaN  \n",
       "241                                   NaN  \n",
       "\n",
       "[242 rows x 18 columns]"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Keep rows whose culmen length exceeds 40, then renumber from 0;\n",
    "# plain reset_index() preserves the old row labels in a new 'index' column.\n",
    "dfa.loc[dfa['Culmen Length (mm)'] > 40].reset_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "id": "bb2b8e61-7ef8-4c77-9896-5352b11b1530",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>10</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>42.0</td>\n",
       "      <td>20.2</td>\n",
       "      <td>190.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.13362</td>\n",
       "      <td>-25.09368</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>13</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>41.1</td>\n",
       "      <td>17.6</td>\n",
       "      <td>182.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>18</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>42.5</td>\n",
       "      <td>20.7</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.67538</td>\n",
       "      <td>-25.13993</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>20</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>46.0</td>\n",
       "      <td>21.5</td>\n",
       "      <td>194.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11616</td>\n",
       "      <td>-24.77227</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>237</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>119</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A1</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>47.2</td>\n",
       "      <td>13.7</td>\n",
       "      <td>214.0</td>\n",
       "      <td>4925.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.99184</td>\n",
       "      <td>-26.20538</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>238</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>239</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>240</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>241</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>242 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708             10  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708             13  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708             18  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708             20  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "237   PAL0910            119    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "238   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "239   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "240   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "241   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N5A2               Yes   11/9/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N7A1               Yes  11/15/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N9A2               Yes  11/12/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage         N10A2               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "237     Biscoe  Adult, 1 Egg Stage         N38A1                No   12/1/09   \n",
       "238     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "239     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "240     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "241     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  40.3               18.0                195.0   \n",
       "1                  42.0               20.2                190.0   \n",
       "2                  41.1               17.6                182.0   \n",
       "3                  42.5               20.7                197.0   \n",
       "4                  46.0               21.5                194.0   \n",
       "..                  ...                ...                  ...   \n",
       "237                47.2               13.7                214.0   \n",
       "238                46.8               14.3                215.0   \n",
       "239                50.4               15.7                222.0   \n",
       "240                45.2               14.8                212.0   \n",
       "241                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3250.0  FEMALE            8.36821          -25.33302   \n",
       "1           4250.0     NaN            9.13362          -25.09368   \n",
       "2           3200.0  FEMALE                NaN                NaN   \n",
       "3           4500.0    MALE            8.67538          -25.13993   \n",
       "4           4200.0    MALE            9.11616          -24.77227   \n",
       "..             ...     ...                ...                ...   \n",
       "237         4925.0  FEMALE            7.99184          -26.20538   \n",
       "238         4850.0  FEMALE            8.41151          -26.13832   \n",
       "239         5750.0    MALE            8.30166          -26.04117   \n",
       "240         5200.0  FEMALE            8.24246          -26.11969   \n",
       "241         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                                 Comments  \n",
       "0                                     NaN  \n",
       "1    No blood sample obtained for sexing.  \n",
       "2          Not enough blood for isotopes.  \n",
       "3                                     NaN  \n",
       "4                                     NaN  \n",
       "..                                    ...  \n",
       "237                                   NaN  \n",
       "238                                   NaN  \n",
       "239                                   NaN  \n",
       "240                                   NaN  \n",
       "241                                   NaN  \n",
       "\n",
       "[242 rows x 17 columns]"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Keep rows whose culmen length exceeds 40, then renumber from 0;\n",
    "# drop=True discards the old row labels instead of adding an 'index' column.\n",
    "dfa.loc[dfa['Culmen Length (mm)'] > 40].reset_index(drop=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "id": "57a073f0-caae-4ca9-b72c-075ae8e98fec",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>344 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "339     Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "..             ...     ...                ...                ...   \n",
       "339            NaN     NaN                NaN                NaN   \n",
       "340         4850.0  FEMALE            8.41151          -26.13832   \n",
       "341         5750.0    MALE            8.30166          -26.04117   \n",
       "342         5200.0  FEMALE            8.24246          -26.11969   \n",
       "343         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                           Comments  \n",
       "0    Not enough blood for isotopes.  \n",
       "1                               NaN  \n",
       "2                               NaN  \n",
       "3                Adult not sampled.  \n",
       "4                               NaN  \n",
       "..                              ...  \n",
       "339                             NaN  \n",
       "340                             NaN  \n",
       "341                             NaN  \n",
       "342                             NaN  \n",
       "343                             NaN  \n",
       "\n",
       "[344 rows x 17 columns]"
      ]
     },
     "execution_count": 54,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "id": "7ffe1dda-b914-4c48-a0f1-2e05df99acf8",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>10</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>42.0</td>\n",
       "      <td>20.2</td>\n",
       "      <td>190.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.13362</td>\n",
       "      <td>-25.09368</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>13</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>41.1</td>\n",
       "      <td>17.6</td>\n",
       "      <td>182.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>18</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>42.5</td>\n",
       "      <td>20.7</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.67538</td>\n",
       "      <td>-25.13993</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>20</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>46.0</td>\n",
       "      <td>21.5</td>\n",
       "      <td>194.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11616</td>\n",
       "      <td>-24.77227</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>237</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>119</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A1</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>47.2</td>\n",
       "      <td>13.7</td>\n",
       "      <td>214.0</td>\n",
       "      <td>4925.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.99184</td>\n",
       "      <td>-26.20538</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>238</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>239</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>240</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>241</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>242 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708             10  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708             13  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708             18  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708             20  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "237   PAL0910            119    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "238   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "239   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "240   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "241   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N5A2               Yes   11/9/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N7A1               Yes  11/15/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N9A2               Yes  11/12/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage         N10A2               Yes  11/16/07   \n",
       "..         ...                 ...           ...               ...       ...   \n",
       "237     Biscoe  Adult, 1 Egg Stage         N38A1                No   12/1/09   \n",
       "238     Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "239     Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "240     Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "241     Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  40.3               18.0                195.0   \n",
       "1                  42.0               20.2                190.0   \n",
       "2                  41.1               17.6                182.0   \n",
       "3                  42.5               20.7                197.0   \n",
       "4                  46.0               21.5                194.0   \n",
       "..                  ...                ...                  ...   \n",
       "237                47.2               13.7                214.0   \n",
       "238                46.8               14.3                215.0   \n",
       "239                50.4               15.7                222.0   \n",
       "240                45.2               14.8                212.0   \n",
       "241                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3250.0  FEMALE            8.36821          -25.33302   \n",
       "1           4250.0     NaN            9.13362          -25.09368   \n",
       "2           3200.0  FEMALE                NaN                NaN   \n",
       "3           4500.0    MALE            8.67538          -25.13993   \n",
       "4           4200.0    MALE            9.11616          -24.77227   \n",
       "..             ...     ...                ...                ...   \n",
       "237         4925.0  FEMALE            7.99184          -26.20538   \n",
       "238         4850.0  FEMALE            8.41151          -26.13832   \n",
       "239         5750.0    MALE            8.30166          -26.04117   \n",
       "240         5200.0  FEMALE            8.24246          -26.11969   \n",
       "241         5400.0    MALE            8.36390          -26.15531   \n",
       "\n",
       "                                 Comments  \n",
       "0                                     NaN  \n",
       "1    No blood sample obtained for sexing.  \n",
       "2          Not enough blood for isotopes.  \n",
       "3                                     NaN  \n",
       "4                                     NaN  \n",
       "..                                    ...  \n",
       "237                                   NaN  \n",
       "238                                   NaN  \n",
       "239                                   NaN  \n",
       "240                                   NaN  \n",
       "241                                   NaN  \n",
       "\n",
       "[242 rows x 17 columns]"
      ]
     },
     "execution_count": 55,
     "metadata": {},
     "output_type": "execute_result"
    }
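   ],
   "source": [
    "# DON'T DO THIS! reset_index(..., inplace=True) mutates `dfs` and returns None,\n",
    "# so the filter and the index reset cannot be written as one chained expression.\n",
    "# Equivalent without in-place mutation:\n",
    "#   dfs = dfa[dfa['Culmen Length (mm)'] > 40].reset_index(drop=True)\n",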
    "dfs = dfa[dfa['Culmen Length (mm)'] > 40]\n",
    "dfs.reset_index(drop=True, inplace=True)\n",
    "dfs"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3374babd-3eea-4ba6-bd4e-b2f7bb3c9c17",
   "metadata": {},
   "source": [
    "### Split-Apply-Combine"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "id": "66e6c38f-1dc0-4c1f-90b2-857ad2616608",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<polars.dataframe.group_by.GroupBy at 0x11b152120>"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.group_by('Island')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "id": "66f46b0e-48b9-4666-8d13-dcb2c173a263",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "('Torgersen',)"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (52, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>1</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.1</td><td>18.7</td><td>181</td><td>3750</td><td>&quot;MALE&quot;</td><td>null</td><td>null</td><td>&quot;Not enough blood for isotopes.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>2</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N1A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/11/07&quot;</td><td>39.5</td><td>17.4</td><td>186</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>8.94956</td><td>-24.69454</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>3</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>40.3</td><td>18.0</td><td>195</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>8.36821</td><td>-25.33302</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>4</td><td>&quot;Adelie Penguin (Pygoscelis 
ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N2A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>&quot;Adult not sampled.&quot;</td></tr><tr><td>&quot;PAL0708&quot;</td><td>5</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N3A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>36.7</td><td>19.3</td><td>193</td><td>3450</td><td>&quot;FEMALE&quot;</td><td>8.76651</td><td>-25.32426</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>128</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N71A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/21/09&quot;</td><td>41.5</td><td>18.3</td><td>195</td><td>4300</td><td>&quot;MALE&quot;</td><td>8.52566</td><td>-26.0245</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>129</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N72A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/18/09&quot;</td><td>39.0</td><td>17.1</td><td>191</td><td>3050</td><td>&quot;FEMALE&quot;</td><td>9.19031</td><td>-25.73722</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>130</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N72A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/18/09&quot;</td><td>44.1</td><td>18.0</td><td>210</td><td>4000</td><td>&quot;MALE&quot;</td><td>9.10702</td><td>-26.01363</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>131</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N73A1&quot;</td><td>&quot;No&quot;</td><td>&quot;11/23/09&quot;</td><td>38.5</td><td>17.9</td><td>190</td><td>3325</td><td>&quot;FEMALE&quot;</td><td>8.9846</td><td>-25.57956</td><td>&quot;Nest never observed with full …</td></tr><tr><td>&quot;PAL0910&quot;</td><td>132</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Torgersen&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N73A2&quot;</td><td>&quot;No&quot;</td><td>&quot;11/23/09&quot;</td><td>43.1</td><td>19.2</td><td>197</td><td>3500</td><td>&quot;MALE&quot;</td><td>8.86495</td><td>-26.1396</td><td>&quot;Nest never observed with full …</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (52, 17)\n",
       "┌───────────┬────────┬─────────────┬────────┬───┬────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ studyName ┆ Sample ┆ Species     ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N  ┆ Delta 13 C  ┆ Comments    │\n",
       "│ ---       ┆ Number ┆ ---         ┆ ---    ┆   ┆ ---    ┆ (o/oo)      ┆ (o/oo)      ┆ ---         │\n",
       "│ str       ┆ ---    ┆ str         ┆ str    ┆   ┆ str    ┆ ---         ┆ ---         ┆ str         │\n",
       "│           ┆ i64    ┆             ┆        ┆   ┆        ┆ f64         ┆ f64         ┆             │\n",
       "╞═══════════╪════════╪═════════════╪════════╪═══╪════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ PAL0708   ┆ 1      ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ null        ┆ null        ┆ Not enough  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ blood for   │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ isotopes.   │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 2      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.94956     ┆ -24.69454   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 3      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.36821     ┆ -25.33302   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 4      ┆ Adelie      ┆ Anvers ┆ … ┆ null   ┆ null        ┆ null        ┆ Adult not   │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ sampled.    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0708   ┆ 5      ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.76651     ┆ -25.32426   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ …         ┆ …      ┆ …           ┆ …      ┆ … ┆ …      ┆ …           ┆ …           ┆ …           │\n",
       "│ PAL0910   ┆ 128    ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ 8.52566     ┆ -26.0245    ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 129    ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 9.19031     ┆ -25.73722   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 130    ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ 9.10702     ┆ -26.01363   ┆ null        │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 131    ┆ Adelie      ┆ Anvers ┆ … ┆ FEMALE ┆ 8.9846      ┆ -25.57956   ┆ Nest never  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ observed    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ with full … │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "│ PAL0910   ┆ 132    ┆ Adelie      ┆ Anvers ┆ … ┆ MALE   ┆ 8.86495     ┆ -26.1396    ┆ Nest never  │\n",
       "│           ┆        ┆ Penguin     ┆        ┆   ┆        ┆             ┆             ┆ observed    │\n",
       "│           ┆        ┆ (Pygoscelis ┆        ┆   ┆        ┆             ┆             ┆ with full … │\n",
       "│           ┆        ┆ ade…        ┆        ┆   ┆        ┆             ┆             ┆             │\n",
       "└───────────┴────────┴─────────────┴────────┴───┴────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "('Dream',)"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (124, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>31</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N21A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/9/07&quot;</td><td>39.5</td><td>16.7</td><td>178</td><td>3250</td><td>&quot;FEMALE&quot;</td><td>9.69756</td><td>-25.11223</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>32</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N21A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/9/07&quot;</td><td>37.2</td><td>18.1</td><td>178</td><td>3900</td><td>&quot;MALE&quot;</td><td>9.72764</td><td>-25.0102</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>33</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N22A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/9/07&quot;</td><td>39.5</td><td>17.8</td><td>188</td><td>3300</td><td>&quot;FEMALE&quot;</td><td>9.66523</td><td>-25.0602</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>34</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N22A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/9/07&quot;</td><td>40.9</td><td>18.9</td><td>184</td><td>3900</td><td>&quot;MALE&quot;</td><td>8.79665</td><td>-25.14591</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>35</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N23A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/16/07&quot;</td><td>36.4</td><td>17.0</td><td>195</td><td>3325</td><td>&quot;FEMALE&quot;</td><td>9.17847</td><td>-25.23061</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>64</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N98A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/19/09&quot;</td><td>55.8</td><td>19.8</td><td>207</td><td>4000</td><td>&quot;MALE&quot;</td><td>9.70465</td><td>-24.53494</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>65</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N99A1&quot;</td><td>&quot;No&quot;</td><td>&quot;11/21/09&quot;</td><td>43.5</td><td>18.1</td><td>202</td><td>3400</td><td>&quot;FEMALE&quot;</td><td>9.37608</td><td>-24.40753</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>66</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N99A2&quot;</td><td>&quot;No&quot;</td><td>&quot;11/21/09&quot;</td><td>49.6</td><td>18.2</td><td>193</td><td>3775</td><td>&quot;MALE&quot;</td><td>9.4618</td><td>-24.70615</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>67</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N100A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/21/09&quot;</td><td>50.8</td><td>19.0</td><td>210</td><td>4100</td><td>&quot;MALE&quot;</td><td>9.98044</td><td>-24.68741</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>68</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>&quot;Anvers&quot;</td><td>&quot;Dream&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N100A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/21/09&quot;</td><td>50.2</td><td>18.7</td><td>198</td><td>3775</td><td>&quot;FEMALE&quot;</td><td>9.39305</td><td>-24.25255</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (124, 17)\n",
       "┌───────────┬────────┬──────────────┬────────┬───┬────────┬──────────────┬──────────────┬──────────┐\n",
       "│ studyName ┆ Sample ┆ Species      ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N   ┆ Delta 13 C   ┆ Comments │\n",
       "│ ---       ┆ Number ┆ ---          ┆ ---    ┆   ┆ ---    ┆ (o/oo)       ┆ (o/oo)       ┆ ---      │\n",
       "│ str       ┆ ---    ┆ str          ┆ str    ┆   ┆ str    ┆ ---          ┆ ---          ┆ str      │\n",
       "│           ┆ i64    ┆              ┆        ┆   ┆        ┆ f64          ┆ f64          ┆          │\n",
       "╞═══════════╪════════╪══════════════╪════════╪═══╪════════╪══════════════╪══════════════╪══════════╡\n",
       "│ PAL0708   ┆ 31     ┆ Adelie       ┆ Anvers ┆ … ┆ FEMALE ┆ 9.69756      ┆ -25.11223    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 32     ┆ Adelie       ┆ Anvers ┆ … ┆ MALE   ┆ 9.72764      ┆ -25.0102     ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 33     ┆ Adelie       ┆ Anvers ┆ … ┆ FEMALE ┆ 9.66523      ┆ -25.0602     ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 34     ┆ Adelie       ┆ Anvers ┆ … ┆ MALE   ┆ 8.79665      ┆ -25.14591    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 35     ┆ Adelie       ┆ Anvers ┆ … ┆ FEMALE ┆ 9.17847      ┆ -25.23061    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ …         ┆ …      ┆ …            ┆ …      ┆ … ┆ …      ┆ …            ┆ …            ┆ …        │\n",
       "│ PAL0910   ┆ 64     ┆ Chinstrap    ┆ Anvers ┆ … ┆ MALE   ┆ 9.70465      ┆ -24.53494    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ …            ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 65     ┆ Chinstrap    ┆ Anvers ┆ … ┆ FEMALE ┆ 9.37608      ┆ -24.40753    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ …            ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 66     ┆ Chinstrap    ┆ Anvers ┆ … ┆ MALE   ┆ 9.4618       ┆ -24.70615    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ …            ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 67     ┆ Chinstrap    ┆ Anvers ┆ … ┆ MALE   ┆ 9.98044      ┆ -24.68741    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ …            ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 68     ┆ Chinstrap    ┆ Anvers ┆ … ┆ FEMALE ┆ 9.39305      ┆ -24.25255    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ …            ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "└───────────┴────────┴──────────────┴────────┴───┴────────┴──────────────┴──────────────┴──────────┘"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "('Biscoe',)"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (168, 17)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>studyName</th><th>Sample Number</th><th>Species</th><th>Region</th><th>Island</th><th>Stage</th><th>Individual ID</th><th>Clutch Completion</th><th>Date Egg</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Body Mass (g)</th><th>Sex</th><th>Delta 15 N (o/oo)</th><th>Delta 13 C (o/oo)</th><th>Comments</th></tr><tr><td>str</td><td>i64</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>str</td><td>f64</td><td>f64</td><td>i64</td><td>i64</td><td>str</td><td>f64</td><td>f64</td><td>str</td></tr></thead><tbody><tr><td>&quot;PAL0708&quot;</td><td>21</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N11A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/12/07&quot;</td><td>37.8</td><td>18.3</td><td>174</td><td>3400</td><td>&quot;FEMALE&quot;</td><td>8.73762</td><td>-25.09383</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>22</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N11A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/12/07&quot;</td><td>37.7</td><td>18.7</td><td>180</td><td>3600</td><td>&quot;MALE&quot;</td><td>8.66271</td><td>-25.0639</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>23</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N12A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/12/07&quot;</td><td>35.9</td><td>19.2</td><td>189</td><td>3800</td><td>&quot;FEMALE&quot;</td><td>9.22286</td><td>-25.03474</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>24</td><td>&quot;Adelie Penguin (Pygoscelis 
ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N12A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/12/07&quot;</td><td>38.2</td><td>18.1</td><td>185</td><td>3950</td><td>&quot;MALE&quot;</td><td>8.43423</td><td>-25.22664</td><td>null</td></tr><tr><td>&quot;PAL0708&quot;</td><td>25</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N13A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/10/07&quot;</td><td>38.8</td><td>17.2</td><td>180</td><td>3800</td><td>&quot;MALE&quot;</td><td>9.63954</td><td>-25.29856</td><td>null</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;PAL0910&quot;</td><td>120</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N38A2&quot;</td><td>&quot;No&quot;</td><td>&quot;12/1/09&quot;</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>121</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N39A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>46.8</td><td>14.3</td><td>215</td><td>4850</td><td>&quot;FEMALE&quot;</td><td>8.41151</td><td>-26.13832</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>122</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg 
Stage&quot;</td><td>&quot;N39A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>50.4</td><td>15.7</td><td>222</td><td>5750</td><td>&quot;MALE&quot;</td><td>8.30166</td><td>-26.04117</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>123</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A1&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>45.2</td><td>14.8</td><td>212</td><td>5200</td><td>&quot;FEMALE&quot;</td><td>8.24246</td><td>-26.11969</td><td>null</td></tr><tr><td>&quot;PAL0910&quot;</td><td>124</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>&quot;Anvers&quot;</td><td>&quot;Biscoe&quot;</td><td>&quot;Adult, 1 Egg Stage&quot;</td><td>&quot;N43A2&quot;</td><td>&quot;Yes&quot;</td><td>&quot;11/22/09&quot;</td><td>49.9</td><td>16.1</td><td>213</td><td>5400</td><td>&quot;MALE&quot;</td><td>8.3639</td><td>-26.15531</td><td>null</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (168, 17)\n",
       "┌───────────┬────────┬──────────────┬────────┬───┬────────┬──────────────┬──────────────┬──────────┐\n",
       "│ studyName ┆ Sample ┆ Species      ┆ Region ┆ … ┆ Sex    ┆ Delta 15 N   ┆ Delta 13 C   ┆ Comments │\n",
       "│ ---       ┆ Number ┆ ---          ┆ ---    ┆   ┆ ---    ┆ (o/oo)       ┆ (o/oo)       ┆ ---      │\n",
       "│ str       ┆ ---    ┆ str          ┆ str    ┆   ┆ str    ┆ ---          ┆ ---          ┆ str      │\n",
       "│           ┆ i64    ┆              ┆        ┆   ┆        ┆ f64          ┆ f64          ┆          │\n",
       "╞═══════════╪════════╪══════════════╪════════╪═══╪════════╪══════════════╪══════════════╪══════════╡\n",
       "│ PAL0708   ┆ 21     ┆ Adelie       ┆ Anvers ┆ … ┆ FEMALE ┆ 8.73762      ┆ -25.09383    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 22     ┆ Adelie       ┆ Anvers ┆ … ┆ MALE   ┆ 8.66271      ┆ -25.0639     ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 23     ┆ Adelie       ┆ Anvers ┆ … ┆ FEMALE ┆ 9.22286      ┆ -25.03474    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 24     ┆ Adelie       ┆ Anvers ┆ … ┆ MALE   ┆ 8.43423      ┆ -25.22664    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0708   ┆ 25     ┆ Adelie       ┆ Anvers ┆ … ┆ MALE   ┆ 9.63954      ┆ -25.29856    ┆ null     │\n",
       "│           ┆        ┆ Penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ ade…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ …         ┆ …      ┆ …            ┆ …      ┆ … ┆ …      ┆ …            ┆ …            ┆ …        │\n",
       "│ PAL0910   ┆ 120    ┆ Gentoo       ┆ Anvers ┆ … ┆ null   ┆ null         ┆ null         ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 121    ┆ Gentoo       ┆ Anvers ┆ … ┆ FEMALE ┆ 8.41151      ┆ -26.13832    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 122    ┆ Gentoo       ┆ Anvers ┆ … ┆ MALE   ┆ 8.30166      ┆ -26.04117    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 123    ┆ Gentoo       ┆ Anvers ┆ … ┆ FEMALE ┆ 8.24246      ┆ -26.11969    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│ PAL0910   ┆ 124    ┆ Gentoo       ┆ Anvers ┆ … ┆ MALE   ┆ 8.3639       ┆ -26.15531    ┆ null     │\n",
       "│           ┆        ┆ penguin      ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ (Pygoscelis  ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "│           ┆        ┆ pap…         ┆        ┆   ┆        ┆              ┆              ┆          │\n",
       "└───────────┴────────┴──────────────┴────────┴───┴────────┴──────────────┴──────────────┴──────────┘"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "for name, gdf in df.group_by('Island'):\n",
    "    display(name, gdf)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "id": "e4aecfbd-7e44-4e6a-8d84-da7448aaaa1f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 2)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>len</th></tr><tr><td>str</td><td>u32</td></tr></thead><tbody><tr><td>&quot;Biscoe&quot;</td><td>168</td></tr><tr><td>&quot;Dream&quot;</td><td>124</td></tr><tr><td>&quot;Torgersen&quot;</td><td>52</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 2)\n",
       "┌───────────┬─────┐\n",
       "│ Island    ┆ len │\n",
       "│ ---       ┆ --- │\n",
       "│ str       ┆ u32 │\n",
       "╞═══════════╪═════╡\n",
       "│ Biscoe    ┆ 168 │\n",
       "│ Dream     ┆ 124 │\n",
       "│ Torgersen ┆ 52  │\n",
       "└───────────┴─────┘"
      ]
     },
     "execution_count": 60,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.group_by('Island').agg(pl.len())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "id": "ef6ad4c0-89a0-48ff-b06d-6d33602a13ed",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 2)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>count</th></tr><tr><td>str</td><td>u32</td></tr></thead><tbody><tr><td>&quot;Torgersen&quot;</td><td>52</td></tr><tr><td>&quot;Biscoe&quot;</td><td>168</td></tr><tr><td>&quot;Dream&quot;</td><td>124</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 2)\n",
       "┌───────────┬───────┐\n",
       "│ Island    ┆ count │\n",
       "│ ---       ┆ ---   │\n",
       "│ str       ┆ u32   │\n",
       "╞═══════════╪═══════╡\n",
       "│ Torgersen ┆ 52    │\n",
       "│ Biscoe    ┆ 168   │\n",
       "│ Dream     ┆ 124   │\n",
       "└───────────┴───────┘"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df['Island'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "id": "1d9fc7e0-9e07-4bfb-8da7-b9255404fa54",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 2)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Culmen Length (mm)</th></tr><tr><td>str</td><td>f64</td></tr></thead><tbody><tr><td>&quot;Torgersen&quot;</td><td>38.95098</td></tr><tr><td>&quot;Biscoe&quot;</td><td>45.257485</td></tr><tr><td>&quot;Dream&quot;</td><td>44.167742</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 2)\n",
       "┌───────────┬────────────────────┐\n",
       "│ Island    ┆ Culmen Length (mm) │\n",
       "│ ---       ┆ ---                │\n",
       "│ str       ┆ f64                │\n",
       "╞═══════════╪════════════════════╡\n",
       "│ Torgersen ┆ 38.95098           │\n",
       "│ Biscoe    ┆ 45.257485          │\n",
       "│ Dream     ┆ 44.167742          │\n",
       "└───────────┴────────────────────┘"
      ]
     },
     "execution_count": 62,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.group_by('Island').agg(pl.col('Culmen Length (mm)').mean())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "id": "fab53853-712c-43d4-8549-ceaf2121a507",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 3)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th></tr><tr><td>str</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;Dream&quot;</td><td>44.167742</td><td>18.344355</td></tr><tr><td>&quot;Torgersen&quot;</td><td>38.95098</td><td>18.429412</td></tr><tr><td>&quot;Biscoe&quot;</td><td>45.257485</td><td>15.87485</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 3)\n",
       "┌───────────┬────────────────────┬───────────────────┐\n",
       "│ Island    ┆ Culmen Length (mm) ┆ Culmen Depth (mm) │\n",
       "│ ---       ┆ ---                ┆ ---               │\n",
       "│ str       ┆ f64                ┆ f64               │\n",
       "╞═══════════╪════════════════════╪═══════════════════╡\n",
       "│ Dream     ┆ 44.167742          ┆ 18.344355         │\n",
       "│ Torgersen ┆ 38.95098           ┆ 18.429412         │\n",
       "│ Biscoe    ┆ 45.257485          ┆ 15.87485          │\n",
       "└───────────┴────────────────────┴───────────────────┘"
      ]
     },
     "execution_count": 63,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.group_by('Island').agg(pl.col('Culmen Length (mm)').mean(), pl.col('Culmen Depth (mm)').mean())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "id": "be01b737-b914-4ece-89de-acb233392ee1",
   "metadata": {},
   "outputs": [
    {
     "ename": "DuplicateError",
     "evalue": "column with name 'Culmen Length (mm)' has more than one occurrence\n\nResolved plan until failure:\n\n\t---> FAILED HERE RESOLVING 'sink' <---\nDF [\"studyName\", \"Sample Number\", \"Species\", \"Region\", ...]; PROJECT */17 COLUMNS",
     "output_type": "error",
     "traceback": [
      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
      "\u001b[31mDuplicateError\u001b[39m                            Traceback (most recent call last)",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[64]\u001b[39m\u001b[32m, line 1\u001b[39m\n\u001b[32m----> \u001b[39m\u001b[32m1\u001b[39m \u001b[43mdf\u001b[49m\u001b[43m.\u001b[49m\u001b[43mgroup_by\u001b[49m\u001b[43m(\u001b[49m\u001b[33;43m'\u001b[39;49m\u001b[33;43mIsland\u001b[39;49m\u001b[33;43m'\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m.\u001b[49m\u001b[43magg\u001b[49m\u001b[43m(\u001b[49m\n\u001b[32m      2\u001b[39m \u001b[43m    \u001b[49m\u001b[43mpl\u001b[49m\u001b[43m.\u001b[49m\u001b[43mcol\u001b[49m\u001b[43m(\u001b[49m\u001b[33;43m'\u001b[39;49m\u001b[33;43mCulmen Length (mm)\u001b[39;49m\u001b[33;43m'\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m.\u001b[49m\u001b[43mmean\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[32m      3\u001b[39m \u001b[43m    \u001b[49m\u001b[43mpl\u001b[49m\u001b[43m.\u001b[49m\u001b[43mcol\u001b[49m\u001b[43m(\u001b[49m\u001b[33;43m'\u001b[39;49m\u001b[33;43mCulmen Length (mm)\u001b[39;49m\u001b[33;43m'\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m.\u001b[49m\u001b[43mmax\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\n\u001b[32m      4\u001b[39m \u001b[43m    \u001b[49m\u001b[43mpl\u001b[49m\u001b[43m.\u001b[49m\u001b[43mcol\u001b[49m\u001b[43m(\u001b[49m\u001b[33;43m'\u001b[39;49m\u001b[33;43mCulmen Depth (mm)\u001b[39;49m\u001b[33;43m'\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m.\u001b[49m\u001b[43mmean\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[32m      5\u001b[39m \u001b[43m)\u001b[49m\n",
      "\u001b[36mFile \u001b[39m\u001b[32m~/Dropbox/Documents/Teaching/cs503-2026sp/.pixi/envs/default/lib/python3.14/site-packages/polars/dataframe/group_by.py:298\u001b[39m, in \u001b[36mGroupBy.agg\u001b[39m\u001b[34m(self, *aggs, **named_aggs)\u001b[39m\n\u001b[32m    195\u001b[39m \u001b[38;5;250m\u001b[39m\u001b[33;03m\"\"\"\u001b[39;00m\n\u001b[32m    196\u001b[39m \u001b[33;03mCompute aggregations for each group of a group by operation.\u001b[39;00m\n\u001b[32m    197\u001b[39m \n\u001b[32m   (...)\u001b[39m\u001b[32m    291\u001b[39m \u001b[33;03m└─────┴───────┴────────────────┘\u001b[39;00m\n\u001b[32m    292\u001b[39m \u001b[33;03m\"\"\"\u001b[39;00m\n\u001b[32m    293\u001b[39m \u001b[38;5;28;01mfrom\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[34;01mpolars\u001b[39;00m\u001b[34;01m.\u001b[39;00m\u001b[34;01mlazyframe\u001b[39;00m\u001b[34;01m.\u001b[39;00m\u001b[34;01mopt_flags\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[38;5;28;01mimport\u001b[39;00m QueryOptFlags\n\u001b[32m    295\u001b[39m \u001b[38;5;28;01mreturn\u001b[39;00m (\n\u001b[32m    296\u001b[39m     \u001b[38;5;28;43mself\u001b[39;49m\u001b[43m.\u001b[49m\u001b[43m_lgb\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[32m    297\u001b[39m \u001b[43m    \u001b[49m\u001b[43m.\u001b[49m\u001b[43magg\u001b[49m\u001b[43m(\u001b[49m\u001b[43m*\u001b[49m\u001b[43maggs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43m*\u001b[49m\u001b[43m*\u001b[49m\u001b[43mnamed_aggs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[32m--> \u001b[39m\u001b[32m298\u001b[39m \u001b[43m    \u001b[49m\u001b[43m.\u001b[49m\u001b[43mcollect\u001b[49m\u001b[43m(\u001b[49m\u001b[43moptimizations\u001b[49m\u001b[43m=\u001b[49m\u001b[43mQueryOptFlags\u001b[49m\u001b[43m.\u001b[49m\u001b[43mnone\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\u001b[43m)\u001b[49m\n\u001b[32m    299\u001b[39m )\n",
      "\u001b[36mFile \u001b[39m\u001b[32m~/Dropbox/Documents/Teaching/cs503-2026sp/.pixi/envs/default/lib/python3.14/site-packages/polars/_utils/deprecation.py:97\u001b[39m, in \u001b[36mdeprecate_streaming_parameter.<locals>.decorate.<locals>.wrapper\u001b[39m\u001b[34m(*args, **kwargs)\u001b[39m\n\u001b[32m     93\u001b[39m         kwargs[\u001b[33m\"\u001b[39m\u001b[33mengine\u001b[39m\u001b[33m\"\u001b[39m] = \u001b[33m\"\u001b[39m\u001b[33min-memory\u001b[39m\u001b[33m\"\u001b[39m\n\u001b[32m     95\u001b[39m     \u001b[38;5;28;01mdel\u001b[39;00m kwargs[\u001b[33m\"\u001b[39m\u001b[33mstreaming\u001b[39m\u001b[33m\"\u001b[39m]\n\u001b[32m---> \u001b[39m\u001b[32m97\u001b[39m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mfunction\u001b[49m\u001b[43m(\u001b[49m\u001b[43m*\u001b[49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43m*\u001b[49m\u001b[43m*\u001b[49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
      "\u001b[36mFile \u001b[39m\u001b[32m~/Dropbox/Documents/Teaching/cs503-2026sp/.pixi/envs/default/lib/python3.14/site-packages/polars/lazyframe/opt_flags.py:328\u001b[39m, in \u001b[36mforward_old_opt_flags.<locals>.decorate.<locals>.wrapper\u001b[39m\u001b[34m(*args, **kwargs)\u001b[39m\n\u001b[32m    325\u001b[39m         optflags = cb(optflags, kwargs.pop(key))  \u001b[38;5;66;03m# type: ignore[no-untyped-call,unused-ignore]\u001b[39;00m\n\u001b[32m    327\u001b[39m kwargs[\u001b[33m\"\u001b[39m\u001b[33moptimizations\u001b[39m\u001b[33m\"\u001b[39m] = optflags\n\u001b[32m--> \u001b[39m\u001b[32m328\u001b[39m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mfunction\u001b[49m\u001b[43m(\u001b[49m\u001b[43m*\u001b[49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43m*\u001b[49m\u001b[43m*\u001b[49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
      "\u001b[36mFile \u001b[39m\u001b[32m~/Dropbox/Documents/Teaching/cs503-2026sp/.pixi/envs/default/lib/python3.14/site-packages/polars/lazyframe/frame.py:2429\u001b[39m, in \u001b[36mLazyFrame.collect\u001b[39m\u001b[34m(self, type_coercion, predicate_pushdown, projection_pushdown, simplify_expression, slice_pushdown, comm_subplan_elim, comm_subexpr_elim, cluster_with_columns, collapse_joins, no_optimization, engine, background, optimizations, **_kwargs)\u001b[39m\n\u001b[32m   2427\u001b[39m \u001b[38;5;66;03m# Only for testing purposes\u001b[39;00m\n\u001b[32m   2428\u001b[39m callback = _kwargs.get(\u001b[33m\"\u001b[39m\u001b[33mpost_opt_callback\u001b[39m\u001b[33m\"\u001b[39m, callback)\n\u001b[32m-> \u001b[39m\u001b[32m2429\u001b[39m \u001b[38;5;28;01mreturn\u001b[39;00m wrap_df(\u001b[43mldf\u001b[49m\u001b[43m.\u001b[49m\u001b[43mcollect\u001b[49m\u001b[43m(\u001b[49m\u001b[43mengine\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mcallback\u001b[49m\u001b[43m)\u001b[49m)\n",
      "\u001b[31mDuplicateError\u001b[39m: column with name 'Culmen Length (mm)' has more than one occurrence\n\nResolved plan until failure:\n\n\t---> FAILED HERE RESOLVING 'sink' <---\nDF [\"studyName\", \"Sample Number\", \"Species\", \"Region\", ...]; PROJECT */17 COLUMNS"
     ]
    }
   ],
   "source": [
    "df.group_by('Island').agg(\n",
    "    pl.col('Culmen Length (mm)').mean(), \n",
    "    pl.col('Culmen Length (mm)').max(), \n",
    "    pl.col('Culmen Depth (mm)').mean()\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "id": "71d3ca22-8111-4d01-b601-a5fcbefbea27",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Culmen Length (mm)</th><th>CLengthMax</th><th>Culmen Depth (mm)</th></tr><tr><td>str</td><td>f64</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;Torgersen&quot;</td><td>38.95098</td><td>46.0</td><td>18.429412</td></tr><tr><td>&quot;Dream&quot;</td><td>44.167742</td><td>58.0</td><td>18.344355</td></tr><tr><td>&quot;Biscoe&quot;</td><td>45.257485</td><td>59.6</td><td>15.87485</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 4)\n",
       "┌───────────┬────────────────────┬────────────┬───────────────────┐\n",
       "│ Island    ┆ Culmen Length (mm) ┆ CLengthMax ┆ Culmen Depth (mm) │\n",
       "│ ---       ┆ ---                ┆ ---        ┆ ---               │\n",
       "│ str       ┆ f64                ┆ f64        ┆ f64               │\n",
       "╞═══════════╪════════════════════╪════════════╪═══════════════════╡\n",
       "│ Torgersen ┆ 38.95098           ┆ 46.0       ┆ 18.429412         │\n",
       "│ Dream     ┆ 44.167742          ┆ 58.0       ┆ 18.344355         │\n",
       "│ Biscoe    ┆ 45.257485          ┆ 59.6       ┆ 15.87485          │\n",
       "└───────────┴────────────────────┴────────────┴───────────────────┘"
      ]
     },
     "execution_count": 65,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Mean and max of the same column would both be named 'Culmen Length (mm)',\n",
    "# so the max is renamed with .alias() to keep the output column names unique.\n",
    "# (Row order from group_by is not guaranteed unless maintain_order=True is passed.)\n",
    "df.group_by('Island').agg(\n",
    "    pl.col('Culmen Length (mm)').mean(),\n",
    "    pl.col('Culmen Length (mm)').max().alias('CLengthMax'),\n",
    "    pl.col('Culmen Depth (mm)').mean(),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "id": "5ed4ec64-98e4-4f15-9c1c-744783fa9fb8",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th></tr><tr><td>str</td><td>f64</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;Dream&quot;</td><td>44.167742</td><td>18.344355</td><td>193.072581</td></tr><tr><td>&quot;Torgersen&quot;</td><td>38.95098</td><td>18.429412</td><td>191.196078</td></tr><tr><td>&quot;Biscoe&quot;</td><td>45.257485</td><td>15.87485</td><td>209.706587</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 4)\n",
       "┌───────────┬────────────────────┬───────────────────┬─────────────────────┐\n",
       "│ Island    ┆ Culmen Length (mm) ┆ Culmen Depth (mm) ┆ Flipper Length (mm) │\n",
       "│ ---       ┆ ---                ┆ ---               ┆ ---                 │\n",
       "│ str       ┆ f64                ┆ f64               ┆ f64                 │\n",
       "╞═══════════╪════════════════════╪═══════════════════╪═════════════════════╡\n",
       "│ Dream     ┆ 44.167742          ┆ 18.344355         ┆ 193.072581          │\n",
       "│ Torgersen ┆ 38.95098           ┆ 18.429412         ┆ 191.196078          │\n",
       "│ Biscoe    ┆ 45.257485          ┆ 15.87485          ┆ 209.706587          │\n",
       "└───────────┴────────────────────┴───────────────────┴─────────────────────┘"
      ]
     },
     "execution_count": 66,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import polars.selectors as cs\n",
    "\n",
    "# Per-island mean of every column whose name matches the '(mm)' regex\n",
    "df.group_by('Island').agg(\n",
    "    cs.matches(r'.*\\(mm\\)').mean(),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 67,
   "id": "bca5536a-41ce-4f18-85fd-1a5c2b1617aa",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (3, 7)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th><th>Flipper Length (mm)</th><th>Culmen Length (mm) Max</th><th>Culmen Depth (mm) Max</th><th>Flipper Length (mm) Max</th></tr><tr><td>str</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>i64</td></tr></thead><tbody><tr><td>&quot;Dream&quot;</td><td>44.167742</td><td>18.344355</td><td>193.072581</td><td>58.0</td><td>21.2</td><td>212</td></tr><tr><td>&quot;Torgersen&quot;</td><td>38.95098</td><td>18.429412</td><td>191.196078</td><td>46.0</td><td>21.5</td><td>210</td></tr><tr><td>&quot;Biscoe&quot;</td><td>45.257485</td><td>15.87485</td><td>209.706587</td><td>59.6</td><td>21.1</td><td>231</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (3, 7)\n",
       "┌───────────┬──────────────┬──────────────┬──────────────┬─────────────┬─────────────┬─────────────┐\n",
       "│ Island    ┆ Culmen       ┆ Culmen Depth ┆ Flipper      ┆ Culmen      ┆ Culmen      ┆ Flipper     │\n",
       "│ ---       ┆ Length (mm)  ┆ (mm)         ┆ Length (mm)  ┆ Length (mm) ┆ Depth (mm)  ┆ Length (mm) │\n",
       "│ str       ┆ ---          ┆ ---          ┆ ---          ┆ Max         ┆ Max         ┆ Max         │\n",
       "│           ┆ f64          ┆ f64          ┆ f64          ┆ ---         ┆ ---         ┆ ---         │\n",
       "│           ┆              ┆              ┆              ┆ f64         ┆ f64         ┆ i64         │\n",
       "╞═══════════╪══════════════╪══════════════╪══════════════╪═════════════╪═════════════╪═════════════╡\n",
       "│ Dream     ┆ 44.167742    ┆ 18.344355    ┆ 193.072581   ┆ 58.0        ┆ 21.2        ┆ 212         │\n",
       "│ Torgersen ┆ 38.95098     ┆ 18.429412    ┆ 191.196078   ┆ 46.0        ┆ 21.5        ┆ 210         │\n",
       "│ Biscoe    ┆ 45.257485    ┆ 15.87485     ┆ 209.706587   ┆ 59.6        ┆ 21.1        ┆ 231         │\n",
       "└───────────┴──────────────┴──────────────┴──────────────┴─────────────┴─────────────┴─────────────┘"
      ]
     },
     "execution_count": 67,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Mean and max of every '(mm)' column per island; the max columns get a\n",
    "# ' Max' suffix so their names do not collide with the mean columns.\n",
    "df.group_by('Island').agg(\n",
    "    cs.matches(r'.*\\(mm\\)').mean(),\n",
    "    cs.matches(r'.*\\(mm\\)').max().name.suffix(' Max'),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "id": "fddfab3c-1848-4eb7-bfca-4e76e688f874",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (5, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>Island</th><th>Species</th><th>Culmen Length (mm)</th><th>Culmen Depth (mm)</th></tr><tr><td>str</td><td>str</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;Torgersen&quot;</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>38.95098</td><td>18.429412</td></tr><tr><td>&quot;Biscoe&quot;</td><td>&quot;Gentoo penguin (Pygoscelis pap…</td><td>47.504878</td><td>14.982114</td></tr><tr><td>&quot;Biscoe&quot;</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>38.975</td><td>18.370455</td></tr><tr><td>&quot;Dream&quot;</td><td>&quot;Chinstrap penguin (Pygoscelis …</td><td>48.833824</td><td>18.420588</td></tr><tr><td>&quot;Dream&quot;</td><td>&quot;Adelie Penguin (Pygoscelis ade…</td><td>38.501786</td><td>18.251786</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (5, 4)\n",
       "┌───────────┬─────────────────────────────────┬────────────────────┬───────────────────┐\n",
       "│ Island    ┆ Species                         ┆ Culmen Length (mm) ┆ Culmen Depth (mm) │\n",
       "│ ---       ┆ ---                             ┆ ---                ┆ ---               │\n",
       "│ str       ┆ str                             ┆ f64                ┆ f64               │\n",
       "╞═══════════╪═════════════════════════════════╪════════════════════╪═══════════════════╡\n",
       "│ Torgersen ┆ Adelie Penguin (Pygoscelis ade… ┆ 38.95098           ┆ 18.429412         │\n",
       "│ Biscoe    ┆ Gentoo penguin (Pygoscelis pap… ┆ 47.504878          ┆ 14.982114         │\n",
       "│ Biscoe    ┆ Adelie Penguin (Pygoscelis ade… ┆ 38.975             ┆ 18.370455         │\n",
       "│ Dream     ┆ Chinstrap penguin (Pygoscelis … ┆ 48.833824          ┆ 18.420588         │\n",
       "│ Dream     ┆ Adelie Penguin (Pygoscelis ade… ┆ 38.501786          ┆ 18.251786         │\n",
       "└───────────┴─────────────────────────────────┴────────────────────┴───────────────────┘"
      ]
     },
     "execution_count": 85,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Group on the (Island, Species) pair and average both culmen measurements\n",
    "df.group_by('Island', 'Species').agg(\n",
    "    pl.col('Culmen Length (mm)').mean(),\n",
    "    pl.col('Culmen Depth (mm)').mean(),\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "a2f56aea-a2f3-4451-90e2-eb16949756e4",
   "metadata": {},
   "source": [
    "##### pandas"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "id": "9df927a2-e2f7-467a-9a28-d4a98ede4598",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<pandas.core.groupby.generic.DataFrameGroupBy object at 0x11b153230>"
      ]
     },
     "execution_count": 68,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# On its own, groupby returns a DataFrameGroupBy object rather than a table\n",
    "dfa.groupby(by='Island')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "id": "f9ac2509-df30-458a-bd80-bd9d7bfc6599",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'Biscoe'"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>21</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N11A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>37.8</td>\n",
       "      <td>18.3</td>\n",
       "      <td>174.0</td>\n",
       "      <td>3400.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.73762</td>\n",
       "      <td>-25.09383</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>22</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N11A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>37.7</td>\n",
       "      <td>18.7</td>\n",
       "      <td>180.0</td>\n",
       "      <td>3600.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.66271</td>\n",
       "      <td>-25.06390</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>23</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N12A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>35.9</td>\n",
       "      <td>19.2</td>\n",
       "      <td>189.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.22286</td>\n",
       "      <td>-25.03474</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>24</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N12A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>38.2</td>\n",
       "      <td>18.1</td>\n",
       "      <td>185.0</td>\n",
       "      <td>3950.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.43423</td>\n",
       "      <td>-25.22664</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>25</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N13A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/10/07</td>\n",
       "      <td>38.8</td>\n",
       "      <td>17.2</td>\n",
       "      <td>180.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.63954</td>\n",
       "      <td>-25.29856</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>339</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>No</td>\n",
       "      <td>12/1/09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>46.8</td>\n",
       "      <td>14.3</td>\n",
       "      <td>215.0</td>\n",
       "      <td>4850.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.41151</td>\n",
       "      <td>-26.13832</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>341</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>50.4</td>\n",
       "      <td>15.7</td>\n",
       "      <td>222.0</td>\n",
       "      <td>5750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.30166</td>\n",
       "      <td>-26.04117</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>342</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>45.2</td>\n",
       "      <td>14.8</td>\n",
       "      <td>212.0</td>\n",
       "      <td>5200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.24246</td>\n",
       "      <td>-26.11969</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>343</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N43A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>49.9</td>\n",
       "      <td>16.1</td>\n",
       "      <td>213.0</td>\n",
       "      <td>5400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.36390</td>\n",
       "      <td>-26.15531</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>168 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "20    PAL0708             21  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "21    PAL0708             22  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "22    PAL0708             23  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "23    PAL0708             24  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "24    PAL0708             25  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "..        ...            ...                                  ...     ...   \n",
       "339   PAL0910            120    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "340   PAL0910            121    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "341   PAL0910            122    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "342   PAL0910            123    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "343   PAL0910            124    Gentoo penguin (Pygoscelis papua)  Anvers   \n",
       "\n",
       "     Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "20   Biscoe  Adult, 1 Egg Stage         N11A1               Yes  11/12/07   \n",
       "21   Biscoe  Adult, 1 Egg Stage         N11A2               Yes  11/12/07   \n",
       "22   Biscoe  Adult, 1 Egg Stage         N12A1               Yes  11/12/07   \n",
       "23   Biscoe  Adult, 1 Egg Stage         N12A2               Yes  11/12/07   \n",
       "24   Biscoe  Adult, 1 Egg Stage         N13A1               Yes  11/10/07   \n",
       "..      ...                 ...           ...               ...       ...   \n",
       "339  Biscoe  Adult, 1 Egg Stage         N38A2                No   12/1/09   \n",
       "340  Biscoe  Adult, 1 Egg Stage         N39A1               Yes  11/22/09   \n",
       "341  Biscoe  Adult, 1 Egg Stage         N39A2               Yes  11/22/09   \n",
       "342  Biscoe  Adult, 1 Egg Stage         N43A1               Yes  11/22/09   \n",
       "343  Biscoe  Adult, 1 Egg Stage         N43A2               Yes  11/22/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "20                 37.8               18.3                174.0   \n",
       "21                 37.7               18.7                180.0   \n",
       "22                 35.9               19.2                189.0   \n",
       "23                 38.2               18.1                185.0   \n",
       "24                 38.8               17.2                180.0   \n",
       "..                  ...                ...                  ...   \n",
       "339                 NaN                NaN                  NaN   \n",
       "340                46.8               14.3                215.0   \n",
       "341                50.4               15.7                222.0   \n",
       "342                45.2               14.8                212.0   \n",
       "343                49.9               16.1                213.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo) Comments  \n",
       "20          3400.0  FEMALE            8.73762          -25.09383      NaN  \n",
       "21          3600.0    MALE            8.66271          -25.06390      NaN  \n",
       "22          3800.0  FEMALE            9.22286          -25.03474      NaN  \n",
       "23          3950.0    MALE            8.43423          -25.22664      NaN  \n",
       "24          3800.0    MALE            9.63954          -25.29856      NaN  \n",
       "..             ...     ...                ...                ...      ...  \n",
       "339            NaN     NaN                NaN                NaN      NaN  \n",
       "340         4850.0  FEMALE            8.41151          -26.13832      NaN  \n",
       "341         5750.0    MALE            8.30166          -26.04117      NaN  \n",
       "342         5200.0  FEMALE            8.24246          -26.11969      NaN  \n",
       "343         5400.0    MALE            8.36390          -26.15531      NaN  \n",
       "\n",
       "[168 rows x 17 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "'Dream'"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>31</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N21A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>16.7</td>\n",
       "      <td>178.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.69756</td>\n",
       "      <td>-25.11223</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>32</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N21A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>37.2</td>\n",
       "      <td>18.1</td>\n",
       "      <td>178.0</td>\n",
       "      <td>3900.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.72764</td>\n",
       "      <td>-25.01020</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>33</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N22A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.8</td>\n",
       "      <td>188.0</td>\n",
       "      <td>3300.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.66523</td>\n",
       "      <td>-25.06020</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>34</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N22A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>40.9</td>\n",
       "      <td>18.9</td>\n",
       "      <td>184.0</td>\n",
       "      <td>3900.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.79665</td>\n",
       "      <td>-25.14591</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>35</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N23A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.4</td>\n",
       "      <td>17.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3325.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.17847</td>\n",
       "      <td>-25.23061</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>215</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>64</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N98A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/19/09</td>\n",
       "      <td>55.8</td>\n",
       "      <td>19.8</td>\n",
       "      <td>207.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.70465</td>\n",
       "      <td>-24.53494</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>216</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>65</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N99A1</td>\n",
       "      <td>No</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>43.5</td>\n",
       "      <td>18.1</td>\n",
       "      <td>202.0</td>\n",
       "      <td>3400.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.37608</td>\n",
       "      <td>-24.40753</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>217</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>66</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N99A2</td>\n",
       "      <td>No</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>49.6</td>\n",
       "      <td>18.2</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3775.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.46180</td>\n",
       "      <td>-24.70615</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>218</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>67</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N100A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>50.8</td>\n",
       "      <td>19.0</td>\n",
       "      <td>210.0</td>\n",
       "      <td>4100.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.98044</td>\n",
       "      <td>-24.68741</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>219</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>68</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Dream</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N100A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>50.2</td>\n",
       "      <td>18.7</td>\n",
       "      <td>198.0</td>\n",
       "      <td>3775.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.39305</td>\n",
       "      <td>-24.25255</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>124 rows × 17 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                                    Species  \\\n",
       "30    PAL0708             31        Adelie Penguin (Pygoscelis adeliae)   \n",
       "31    PAL0708             32        Adelie Penguin (Pygoscelis adeliae)   \n",
       "32    PAL0708             33        Adelie Penguin (Pygoscelis adeliae)   \n",
       "33    PAL0708             34        Adelie Penguin (Pygoscelis adeliae)   \n",
       "34    PAL0708             35        Adelie Penguin (Pygoscelis adeliae)   \n",
       "..        ...            ...                                        ...   \n",
       "215   PAL0910             64  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "216   PAL0910             65  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "217   PAL0910             66  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "218   PAL0910             67  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "219   PAL0910             68  Chinstrap penguin (Pygoscelis antarctica)   \n",
       "\n",
       "     Region Island               Stage Individual ID Clutch Completion  \\\n",
       "30   Anvers  Dream  Adult, 1 Egg Stage         N21A1               Yes   \n",
       "31   Anvers  Dream  Adult, 1 Egg Stage         N21A2               Yes   \n",
       "32   Anvers  Dream  Adult, 1 Egg Stage         N22A1               Yes   \n",
       "33   Anvers  Dream  Adult, 1 Egg Stage         N22A2               Yes   \n",
       "34   Anvers  Dream  Adult, 1 Egg Stage         N23A1               Yes   \n",
       "..      ...    ...                 ...           ...               ...   \n",
       "215  Anvers  Dream  Adult, 1 Egg Stage         N98A2               Yes   \n",
       "216  Anvers  Dream  Adult, 1 Egg Stage         N99A1                No   \n",
       "217  Anvers  Dream  Adult, 1 Egg Stage         N99A2                No   \n",
       "218  Anvers  Dream  Adult, 1 Egg Stage        N100A1               Yes   \n",
       "219  Anvers  Dream  Adult, 1 Egg Stage        N100A2               Yes   \n",
       "\n",
       "     Date Egg  Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "30    11/9/07                39.5               16.7                178.0   \n",
       "31    11/9/07                37.2               18.1                178.0   \n",
       "32    11/9/07                39.5               17.8                188.0   \n",
       "33    11/9/07                40.9               18.9                184.0   \n",
       "34   11/16/07                36.4               17.0                195.0   \n",
       "..        ...                 ...                ...                  ...   \n",
       "215  11/19/09                55.8               19.8                207.0   \n",
       "216  11/21/09                43.5               18.1                202.0   \n",
       "217  11/21/09                49.6               18.2                193.0   \n",
       "218  11/21/09                50.8               19.0                210.0   \n",
       "219  11/21/09                50.2               18.7                198.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo) Comments  \n",
       "30          3250.0  FEMALE            9.69756          -25.11223      NaN  \n",
       "31          3900.0    MALE            9.72764          -25.01020      NaN  \n",
       "32          3300.0  FEMALE            9.66523          -25.06020      NaN  \n",
       "33          3900.0    MALE            8.79665          -25.14591      NaN  \n",
       "34          3325.0  FEMALE            9.17847          -25.23061      NaN  \n",
       "..             ...     ...                ...                ...      ...  \n",
       "215         4000.0    MALE            9.70465          -24.53494      NaN  \n",
       "216         3400.0  FEMALE            9.37608          -24.40753      NaN  \n",
       "217         3775.0    MALE            9.46180          -24.70615      NaN  \n",
       "218         4100.0    MALE            9.98044          -24.68741      NaN  \n",
       "219         3775.0  FEMALE            9.39305          -24.25255      NaN  \n",
       "\n",
       "[124 rows x 17 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "'Torgersen'"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>studyName</th>\n",
       "      <th>Sample Number</th>\n",
       "      <th>Species</th>\n",
       "      <th>Region</th>\n",
       "      <th>Island</th>\n",
       "      <th>Stage</th>\n",
       "      <th>Individual ID</th>\n",
       "      <th>Clutch Completion</th>\n",
       "      <th>Date Egg</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "      <th>Flipper Length (mm)</th>\n",
       "      <th>Body Mass (g)</th>\n",
       "      <th>Sex</th>\n",
       "      <th>Delta 15 N (o/oo)</th>\n",
       "      <th>Delta 13 C (o/oo)</th>\n",
       "      <th>Comments</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>1</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.1</td>\n",
       "      <td>18.7</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3750.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>2</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N1A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/07</td>\n",
       "      <td>39.5</td>\n",
       "      <td>17.4</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.94956</td>\n",
       "      <td>-24.69454</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>3</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>40.3</td>\n",
       "      <td>18.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3250.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.36821</td>\n",
       "      <td>-25.33302</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>4</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N2A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Adult not sampled.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>5</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.7</td>\n",
       "      <td>19.3</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.76651</td>\n",
       "      <td>-25.32426</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>6</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N3A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>39.3</td>\n",
       "      <td>20.6</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3650.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.66496</td>\n",
       "      <td>-25.29805</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>7</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N4A1</td>\n",
       "      <td>No</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>38.9</td>\n",
       "      <td>17.8</td>\n",
       "      <td>181.0</td>\n",
       "      <td>3625.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.18718</td>\n",
       "      <td>-25.21799</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>8</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N4A2</td>\n",
       "      <td>No</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>39.2</td>\n",
       "      <td>19.6</td>\n",
       "      <td>195.0</td>\n",
       "      <td>4675.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.46060</td>\n",
       "      <td>-24.89958</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>9</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>34.1</td>\n",
       "      <td>18.1</td>\n",
       "      <td>193.0</td>\n",
       "      <td>3475.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>No blood sample obtained.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>10</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N5A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>42.0</td>\n",
       "      <td>20.2</td>\n",
       "      <td>190.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.13362</td>\n",
       "      <td>-25.09368</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>11</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N6A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>37.8</td>\n",
       "      <td>17.1</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3300.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.63243</td>\n",
       "      <td>-25.21315</td>\n",
       "      <td>No blood sample obtained for sexing.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>12</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N6A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/07</td>\n",
       "      <td>37.8</td>\n",
       "      <td>17.3</td>\n",
       "      <td>180.0</td>\n",
       "      <td>3700.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>No blood sample obtained.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>13</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>41.1</td>\n",
       "      <td>17.6</td>\n",
       "      <td>182.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>14</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N7A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/15/07</td>\n",
       "      <td>38.6</td>\n",
       "      <td>21.2</td>\n",
       "      <td>191.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>15</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N8A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>34.6</td>\n",
       "      <td>21.1</td>\n",
       "      <td>198.0</td>\n",
       "      <td>4400.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.55583</td>\n",
       "      <td>-25.22588</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>16</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N8A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>36.6</td>\n",
       "      <td>17.8</td>\n",
       "      <td>185.0</td>\n",
       "      <td>3700.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Not enough blood for isotopes.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>17</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>38.7</td>\n",
       "      <td>19.0</td>\n",
       "      <td>195.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.18528</td>\n",
       "      <td>-25.06691</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>18</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N9A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/12/07</td>\n",
       "      <td>42.5</td>\n",
       "      <td>20.7</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.67538</td>\n",
       "      <td>-25.13993</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>19</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>34.4</td>\n",
       "      <td>18.4</td>\n",
       "      <td>184.0</td>\n",
       "      <td>3325.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.47827</td>\n",
       "      <td>-25.23319</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>PAL0708</td>\n",
       "      <td>20</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N10A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/07</td>\n",
       "      <td>46.0</td>\n",
       "      <td>21.5</td>\n",
       "      <td>194.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11616</td>\n",
       "      <td>-24.77227</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>69</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N32A1</td>\n",
       "      <td>No</td>\n",
       "      <td>11/11/08</td>\n",
       "      <td>35.9</td>\n",
       "      <td>16.6</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3050.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.47781</td>\n",
       "      <td>-26.07821</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>69</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>70</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N32A2</td>\n",
       "      <td>No</td>\n",
       "      <td>11/11/08</td>\n",
       "      <td>41.8</td>\n",
       "      <td>19.4</td>\n",
       "      <td>198.0</td>\n",
       "      <td>4450.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.86853</td>\n",
       "      <td>-26.06209</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>71</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N34A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/14/08</td>\n",
       "      <td>33.5</td>\n",
       "      <td>19.0</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3600.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.88863</td>\n",
       "      <td>-26.63085</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>71</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>72</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N34A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/14/08</td>\n",
       "      <td>39.7</td>\n",
       "      <td>18.4</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3900.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.29808</td>\n",
       "      <td>-25.23453</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>72</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>73</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N35A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/08</td>\n",
       "      <td>39.6</td>\n",
       "      <td>17.2</td>\n",
       "      <td>196.0</td>\n",
       "      <td>3550.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.33524</td>\n",
       "      <td>-26.55351</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>73</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>74</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N35A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/11/08</td>\n",
       "      <td>45.8</td>\n",
       "      <td>18.9</td>\n",
       "      <td>197.0</td>\n",
       "      <td>4150.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.18658</td>\n",
       "      <td>-26.45978</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>74</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>75</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N36A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/8/08</td>\n",
       "      <td>35.5</td>\n",
       "      <td>17.5</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3700.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.70642</td>\n",
       "      <td>-26.15003</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>76</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N36A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/8/08</td>\n",
       "      <td>42.8</td>\n",
       "      <td>18.5</td>\n",
       "      <td>195.0</td>\n",
       "      <td>4250.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.29930</td>\n",
       "      <td>-26.38986</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>76</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>77</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N37A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/6/08</td>\n",
       "      <td>40.9</td>\n",
       "      <td>16.8</td>\n",
       "      <td>191.0</td>\n",
       "      <td>3700.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.47257</td>\n",
       "      <td>-26.02002</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>77</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>78</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N37A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/6/08</td>\n",
       "      <td>37.2</td>\n",
       "      <td>19.4</td>\n",
       "      <td>184.0</td>\n",
       "      <td>3900.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.35540</td>\n",
       "      <td>-26.44787</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>78</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>79</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/08</td>\n",
       "      <td>36.2</td>\n",
       "      <td>16.1</td>\n",
       "      <td>187.0</td>\n",
       "      <td>3550.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.82381</td>\n",
       "      <td>-26.51382</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>79</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>80</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N38A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/9/08</td>\n",
       "      <td>42.1</td>\n",
       "      <td>19.1</td>\n",
       "      <td>195.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.05736</td>\n",
       "      <td>-25.81513</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>80</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>81</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/2/08</td>\n",
       "      <td>34.6</td>\n",
       "      <td>17.2</td>\n",
       "      <td>189.0</td>\n",
       "      <td>3200.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.69778</td>\n",
       "      <td>-26.53870</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>81</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>82</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N39A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/2/08</td>\n",
       "      <td>42.9</td>\n",
       "      <td>17.6</td>\n",
       "      <td>196.0</td>\n",
       "      <td>4700.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.63259</td>\n",
       "      <td>-26.23027</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>82</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>83</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N40A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/7/08</td>\n",
       "      <td>36.7</td>\n",
       "      <td>18.8</td>\n",
       "      <td>187.0</td>\n",
       "      <td>3800.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>7.88494</td>\n",
       "      <td>-26.24837</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>83</th>\n",
       "      <td>PAL0809</td>\n",
       "      <td>84</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N40A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/7/08</td>\n",
       "      <td>35.1</td>\n",
       "      <td>19.4</td>\n",
       "      <td>193.0</td>\n",
       "      <td>4200.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.90002</td>\n",
       "      <td>-26.46254</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>116</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>117</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N63A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>38.6</td>\n",
       "      <td>17.0</td>\n",
       "      <td>188.0</td>\n",
       "      <td>2900.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.18021</td>\n",
       "      <td>-25.77264</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>117</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>118</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N63A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>37.3</td>\n",
       "      <td>20.5</td>\n",
       "      <td>199.0</td>\n",
       "      <td>3775.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.49645</td>\n",
       "      <td>-26.36678</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>118</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>119</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N64A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>35.7</td>\n",
       "      <td>17.0</td>\n",
       "      <td>189.0</td>\n",
       "      <td>3350.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.96436</td>\n",
       "      <td>-23.90309</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>119</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>120</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N64A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/22/09</td>\n",
       "      <td>41.1</td>\n",
       "      <td>18.6</td>\n",
       "      <td>189.0</td>\n",
       "      <td>3325.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.32277</td>\n",
       "      <td>-26.09989</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>120</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>121</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N66A1</td>\n",
       "      <td>No</td>\n",
       "      <td>11/17/09</td>\n",
       "      <td>36.2</td>\n",
       "      <td>17.2</td>\n",
       "      <td>187.0</td>\n",
       "      <td>3150.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.04296</td>\n",
       "      <td>-26.19444</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>121</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>122</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N66A2</td>\n",
       "      <td>No</td>\n",
       "      <td>11/17/09</td>\n",
       "      <td>37.7</td>\n",
       "      <td>19.8</td>\n",
       "      <td>198.0</td>\n",
       "      <td>3500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.11066</td>\n",
       "      <td>-26.42563</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>122</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>123</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N67A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/09</td>\n",
       "      <td>40.2</td>\n",
       "      <td>17.0</td>\n",
       "      <td>176.0</td>\n",
       "      <td>3450.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.30722</td>\n",
       "      <td>-25.61039</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>123</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>124</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N67A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/16/09</td>\n",
       "      <td>41.4</td>\n",
       "      <td>18.5</td>\n",
       "      <td>202.0</td>\n",
       "      <td>3875.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.59462</td>\n",
       "      <td>-25.42621</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>124</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>125</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N69A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>35.2</td>\n",
       "      <td>15.9</td>\n",
       "      <td>186.0</td>\n",
       "      <td>3050.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.81668</td>\n",
       "      <td>-25.95399</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>125</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>126</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N69A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>40.6</td>\n",
       "      <td>19.0</td>\n",
       "      <td>199.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.22537</td>\n",
       "      <td>-25.60826</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>126</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>127</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N71A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>38.8</td>\n",
       "      <td>17.6</td>\n",
       "      <td>191.0</td>\n",
       "      <td>3275.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.88098</td>\n",
       "      <td>-25.89741</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>127</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>128</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N71A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/21/09</td>\n",
       "      <td>41.5</td>\n",
       "      <td>18.3</td>\n",
       "      <td>195.0</td>\n",
       "      <td>4300.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.52566</td>\n",
       "      <td>-26.02450</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>128</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>129</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N72A1</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>39.0</td>\n",
       "      <td>17.1</td>\n",
       "      <td>191.0</td>\n",
       "      <td>3050.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>9.19031</td>\n",
       "      <td>-25.73722</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>129</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>130</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N72A2</td>\n",
       "      <td>Yes</td>\n",
       "      <td>11/18/09</td>\n",
       "      <td>44.1</td>\n",
       "      <td>18.0</td>\n",
       "      <td>210.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>9.10702</td>\n",
       "      <td>-26.01363</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>130</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>131</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N73A1</td>\n",
       "      <td>No</td>\n",
       "      <td>11/23/09</td>\n",
       "      <td>38.5</td>\n",
       "      <td>17.9</td>\n",
       "      <td>190.0</td>\n",
       "      <td>3325.0</td>\n",
       "      <td>FEMALE</td>\n",
       "      <td>8.98460</td>\n",
       "      <td>-25.57956</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>131</th>\n",
       "      <td>PAL0910</td>\n",
       "      <td>132</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>Anvers</td>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adult, 1 Egg Stage</td>\n",
       "      <td>N73A2</td>\n",
       "      <td>No</td>\n",
       "      <td>11/23/09</td>\n",
       "      <td>43.1</td>\n",
       "      <td>19.2</td>\n",
       "      <td>197.0</td>\n",
       "      <td>3500.0</td>\n",
       "      <td>MALE</td>\n",
       "      <td>8.86495</td>\n",
       "      <td>-26.13960</td>\n",
       "      <td>Nest never observed with full clutch.</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    studyName  Sample Number                              Species  Region  \\\n",
       "0     PAL0708              1  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "1     PAL0708              2  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "2     PAL0708              3  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "3     PAL0708              4  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "4     PAL0708              5  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "5     PAL0708              6  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "6     PAL0708              7  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "7     PAL0708              8  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "8     PAL0708              9  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "9     PAL0708             10  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "10    PAL0708             11  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "11    PAL0708             12  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "12    PAL0708             13  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "13    PAL0708             14  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "14    PAL0708             15  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "15    PAL0708             16  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "16    PAL0708             17  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "17    PAL0708             18  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "18    PAL0708             19  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "19    PAL0708             20  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "68    PAL0809             69  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "69    PAL0809             70  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "70    PAL0809             71  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "71    PAL0809             72  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "72    PAL0809             73  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "73    PAL0809             74  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "74    PAL0809             75  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "75    PAL0809             76  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "76    PAL0809             77  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "77    PAL0809             78  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "78    PAL0809             79  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "79    PAL0809             80  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "80    PAL0809             81  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "81    PAL0809             82  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "82    PAL0809             83  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "83    PAL0809             84  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "116   PAL0910            117  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "117   PAL0910            118  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "118   PAL0910            119  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "119   PAL0910            120  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "120   PAL0910            121  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "121   PAL0910            122  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "122   PAL0910            123  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "123   PAL0910            124  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "124   PAL0910            125  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "125   PAL0910            126  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "126   PAL0910            127  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "127   PAL0910            128  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "128   PAL0910            129  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "129   PAL0910            130  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "130   PAL0910            131  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "131   PAL0910            132  Adelie Penguin (Pygoscelis adeliae)  Anvers   \n",
       "\n",
       "        Island               Stage Individual ID Clutch Completion  Date Egg  \\\n",
       "0    Torgersen  Adult, 1 Egg Stage          N1A1               Yes  11/11/07   \n",
       "1    Torgersen  Adult, 1 Egg Stage          N1A2               Yes  11/11/07   \n",
       "2    Torgersen  Adult, 1 Egg Stage          N2A1               Yes  11/16/07   \n",
       "3    Torgersen  Adult, 1 Egg Stage          N2A2               Yes  11/16/07   \n",
       "4    Torgersen  Adult, 1 Egg Stage          N3A1               Yes  11/16/07   \n",
       "5    Torgersen  Adult, 1 Egg Stage          N3A2               Yes  11/16/07   \n",
       "6    Torgersen  Adult, 1 Egg Stage          N4A1                No  11/15/07   \n",
       "7    Torgersen  Adult, 1 Egg Stage          N4A2                No  11/15/07   \n",
       "8    Torgersen  Adult, 1 Egg Stage          N5A1               Yes   11/9/07   \n",
       "9    Torgersen  Adult, 1 Egg Stage          N5A2               Yes   11/9/07   \n",
       "10   Torgersen  Adult, 1 Egg Stage          N6A1               Yes   11/9/07   \n",
       "11   Torgersen  Adult, 1 Egg Stage          N6A2               Yes   11/9/07   \n",
       "12   Torgersen  Adult, 1 Egg Stage          N7A1               Yes  11/15/07   \n",
       "13   Torgersen  Adult, 1 Egg Stage          N7A2               Yes  11/15/07   \n",
       "14   Torgersen  Adult, 1 Egg Stage          N8A1               Yes  11/16/07   \n",
       "15   Torgersen  Adult, 1 Egg Stage          N8A2               Yes  11/16/07   \n",
       "16   Torgersen  Adult, 1 Egg Stage          N9A1               Yes  11/12/07   \n",
       "17   Torgersen  Adult, 1 Egg Stage          N9A2               Yes  11/12/07   \n",
       "18   Torgersen  Adult, 1 Egg Stage         N10A1               Yes  11/16/07   \n",
       "19   Torgersen  Adult, 1 Egg Stage         N10A2               Yes  11/16/07   \n",
       "68   Torgersen  Adult, 1 Egg Stage         N32A1                No  11/11/08   \n",
       "69   Torgersen  Adult, 1 Egg Stage         N32A2                No  11/11/08   \n",
       "70   Torgersen  Adult, 1 Egg Stage         N34A1               Yes  11/14/08   \n",
       "71   Torgersen  Adult, 1 Egg Stage         N34A2               Yes  11/14/08   \n",
       "72   Torgersen  Adult, 1 Egg Stage         N35A1               Yes  11/11/08   \n",
       "73   Torgersen  Adult, 1 Egg Stage         N35A2               Yes  11/11/08   \n",
       "74   Torgersen  Adult, 1 Egg Stage         N36A1               Yes   11/8/08   \n",
       "75   Torgersen  Adult, 1 Egg Stage         N36A2               Yes   11/8/08   \n",
       "76   Torgersen  Adult, 1 Egg Stage         N37A1               Yes   11/6/08   \n",
       "77   Torgersen  Adult, 1 Egg Stage         N37A2               Yes   11/6/08   \n",
       "78   Torgersen  Adult, 1 Egg Stage         N38A1               Yes   11/9/08   \n",
       "79   Torgersen  Adult, 1 Egg Stage         N38A2               Yes   11/9/08   \n",
       "80   Torgersen  Adult, 1 Egg Stage         N39A1               Yes   11/2/08   \n",
       "81   Torgersen  Adult, 1 Egg Stage         N39A2               Yes   11/2/08   \n",
       "82   Torgersen  Adult, 1 Egg Stage         N40A1               Yes   11/7/08   \n",
       "83   Torgersen  Adult, 1 Egg Stage         N40A2               Yes   11/7/08   \n",
       "116  Torgersen  Adult, 1 Egg Stage         N63A1               Yes  11/18/09   \n",
       "117  Torgersen  Adult, 1 Egg Stage         N63A2               Yes  11/18/09   \n",
       "118  Torgersen  Adult, 1 Egg Stage         N64A1               Yes  11/22/09   \n",
       "119  Torgersen  Adult, 1 Egg Stage         N64A2               Yes  11/22/09   \n",
       "120  Torgersen  Adult, 1 Egg Stage         N66A1                No  11/17/09   \n",
       "121  Torgersen  Adult, 1 Egg Stage         N66A2                No  11/17/09   \n",
       "122  Torgersen  Adult, 1 Egg Stage         N67A1               Yes  11/16/09   \n",
       "123  Torgersen  Adult, 1 Egg Stage         N67A2               Yes  11/16/09   \n",
       "124  Torgersen  Adult, 1 Egg Stage         N69A1               Yes  11/18/09   \n",
       "125  Torgersen  Adult, 1 Egg Stage         N69A2               Yes  11/18/09   \n",
       "126  Torgersen  Adult, 1 Egg Stage         N71A1               Yes  11/21/09   \n",
       "127  Torgersen  Adult, 1 Egg Stage         N71A2               Yes  11/21/09   \n",
       "128  Torgersen  Adult, 1 Egg Stage         N72A1               Yes  11/18/09   \n",
       "129  Torgersen  Adult, 1 Egg Stage         N72A2               Yes  11/18/09   \n",
       "130  Torgersen  Adult, 1 Egg Stage         N73A1                No  11/23/09   \n",
       "131  Torgersen  Adult, 1 Egg Stage         N73A2                No  11/23/09   \n",
       "\n",
       "     Culmen Length (mm)  Culmen Depth (mm)  Flipper Length (mm)  \\\n",
       "0                  39.1               18.7                181.0   \n",
       "1                  39.5               17.4                186.0   \n",
       "2                  40.3               18.0                195.0   \n",
       "3                   NaN                NaN                  NaN   \n",
       "4                  36.7               19.3                193.0   \n",
       "5                  39.3               20.6                190.0   \n",
       "6                  38.9               17.8                181.0   \n",
       "7                  39.2               19.6                195.0   \n",
       "8                  34.1               18.1                193.0   \n",
       "9                  42.0               20.2                190.0   \n",
       "10                 37.8               17.1                186.0   \n",
       "11                 37.8               17.3                180.0   \n",
       "12                 41.1               17.6                182.0   \n",
       "13                 38.6               21.2                191.0   \n",
       "14                 34.6               21.1                198.0   \n",
       "15                 36.6               17.8                185.0   \n",
       "16                 38.7               19.0                195.0   \n",
       "17                 42.5               20.7                197.0   \n",
       "18                 34.4               18.4                184.0   \n",
       "19                 46.0               21.5                194.0   \n",
       "68                 35.9               16.6                190.0   \n",
       "69                 41.8               19.4                198.0   \n",
       "70                 33.5               19.0                190.0   \n",
       "71                 39.7               18.4                190.0   \n",
       "72                 39.6               17.2                196.0   \n",
       "73                 45.8               18.9                197.0   \n",
       "74                 35.5               17.5                190.0   \n",
       "75                 42.8               18.5                195.0   \n",
       "76                 40.9               16.8                191.0   \n",
       "77                 37.2               19.4                184.0   \n",
       "78                 36.2               16.1                187.0   \n",
       "79                 42.1               19.1                195.0   \n",
       "80                 34.6               17.2                189.0   \n",
       "81                 42.9               17.6                196.0   \n",
       "82                 36.7               18.8                187.0   \n",
       "83                 35.1               19.4                193.0   \n",
       "116                38.6               17.0                188.0   \n",
       "117                37.3               20.5                199.0   \n",
       "118                35.7               17.0                189.0   \n",
       "119                41.1               18.6                189.0   \n",
       "120                36.2               17.2                187.0   \n",
       "121                37.7               19.8                198.0   \n",
       "122                40.2               17.0                176.0   \n",
       "123                41.4               18.5                202.0   \n",
       "124                35.2               15.9                186.0   \n",
       "125                40.6               19.0                199.0   \n",
       "126                38.8               17.6                191.0   \n",
       "127                41.5               18.3                195.0   \n",
       "128                39.0               17.1                191.0   \n",
       "129                44.1               18.0                210.0   \n",
       "130                38.5               17.9                190.0   \n",
       "131                43.1               19.2                197.0   \n",
       "\n",
       "     Body Mass (g)     Sex  Delta 15 N (o/oo)  Delta 13 C (o/oo)  \\\n",
       "0           3750.0    MALE                NaN                NaN   \n",
       "1           3800.0  FEMALE            8.94956          -24.69454   \n",
       "2           3250.0  FEMALE            8.36821          -25.33302   \n",
       "3              NaN     NaN                NaN                NaN   \n",
       "4           3450.0  FEMALE            8.76651          -25.32426   \n",
       "5           3650.0    MALE            8.66496          -25.29805   \n",
       "6           3625.0  FEMALE            9.18718          -25.21799   \n",
       "7           4675.0    MALE            9.46060          -24.89958   \n",
       "8           3475.0     NaN                NaN                NaN   \n",
       "9           4250.0     NaN            9.13362          -25.09368   \n",
       "10          3300.0     NaN            8.63243          -25.21315   \n",
       "11          3700.0     NaN                NaN                NaN   \n",
       "12          3200.0  FEMALE                NaN                NaN   \n",
       "13          3800.0    MALE                NaN                NaN   \n",
       "14          4400.0    MALE            8.55583          -25.22588   \n",
       "15          3700.0  FEMALE                NaN                NaN   \n",
       "16          3450.0  FEMALE            9.18528          -25.06691   \n",
       "17          4500.0    MALE            8.67538          -25.13993   \n",
       "18          3325.0  FEMALE            8.47827          -25.23319   \n",
       "19          4200.0    MALE            9.11616          -24.77227   \n",
       "68          3050.0  FEMALE            8.47781          -26.07821   \n",
       "69          4450.0    MALE            8.86853          -26.06209   \n",
       "70          3600.0  FEMALE            7.88863          -26.63085   \n",
       "71          3900.0    MALE            9.29808          -25.23453   \n",
       "72          3550.0  FEMALE            8.33524          -26.55351   \n",
       "73          4150.0    MALE            8.18658          -26.45978   \n",
       "74          3700.0  FEMALE            8.70642          -26.15003   \n",
       "75          4250.0    MALE            8.29930          -26.38986   \n",
       "76          3700.0  FEMALE            8.47257          -26.02002   \n",
       "77          3900.0    MALE            8.35540          -26.44787   \n",
       "78          3550.0  FEMALE            7.82381          -26.51382   \n",
       "79          4000.0    MALE            9.05736          -25.81513   \n",
       "80          3200.0  FEMALE            7.69778          -26.53870   \n",
       "81          4700.0    MALE            8.63259          -26.23027   \n",
       "82          3800.0  FEMALE            7.88494          -26.24837   \n",
       "83          4200.0    MALE            8.90002          -26.46254   \n",
       "116         2900.0  FEMALE            9.18021          -25.77264   \n",
       "117         3775.0    MALE            9.49645          -26.36678   \n",
       "118         3350.0  FEMALE            8.96436          -23.90309   \n",
       "119         3325.0    MALE            9.32277          -26.09989   \n",
       "120         3150.0  FEMALE            9.04296          -26.19444   \n",
       "121         3500.0    MALE            9.11066          -26.42563   \n",
       "122         3450.0  FEMALE            9.30722          -25.61039   \n",
       "123         3875.0    MALE            9.59462          -25.42621   \n",
       "124         3050.0  FEMALE            8.81668          -25.95399   \n",
       "125         4000.0    MALE            9.22537          -25.60826   \n",
       "126         3275.0  FEMALE            8.88098          -25.89741   \n",
       "127         4300.0    MALE            8.52566          -26.02450   \n",
       "128         3050.0  FEMALE            9.19031          -25.73722   \n",
       "129         4000.0    MALE            9.10702          -26.01363   \n",
       "130         3325.0  FEMALE            8.98460          -25.57956   \n",
       "131         3500.0    MALE            8.86495          -26.13960   \n",
       "\n",
       "                                  Comments  \n",
       "0           Not enough blood for isotopes.  \n",
       "1                                      NaN  \n",
       "2                                      NaN  \n",
       "3                       Adult not sampled.  \n",
       "4                                      NaN  \n",
       "5                                      NaN  \n",
       "6    Nest never observed with full clutch.  \n",
       "7    Nest never observed with full clutch.  \n",
       "8                No blood sample obtained.  \n",
       "9     No blood sample obtained for sexing.  \n",
       "10    No blood sample obtained for sexing.  \n",
       "11               No blood sample obtained.  \n",
       "12          Not enough blood for isotopes.  \n",
       "13          Not enough blood for isotopes.  \n",
       "14                                     NaN  \n",
       "15          Not enough blood for isotopes.  \n",
       "16                                     NaN  \n",
       "17                                     NaN  \n",
       "18                                     NaN  \n",
       "19                                     NaN  \n",
       "68   Nest never observed with full clutch.  \n",
       "69   Nest never observed with full clutch.  \n",
       "70                                     NaN  \n",
       "71                                     NaN  \n",
       "72                                     NaN  \n",
       "73                                     NaN  \n",
       "74                                     NaN  \n",
       "75                                     NaN  \n",
       "76                                     NaN  \n",
       "77                                     NaN  \n",
       "78                                     NaN  \n",
       "79                                     NaN  \n",
       "80                                     NaN  \n",
       "81                                     NaN  \n",
       "82                                     NaN  \n",
       "83                                     NaN  \n",
       "116                                    NaN  \n",
       "117                                    NaN  \n",
       "118                                    NaN  \n",
       "119                                    NaN  \n",
       "120  Nest never observed with full clutch.  \n",
       "121  Nest never observed with full clutch.  \n",
       "122                                    NaN  \n",
       "123                                    NaN  \n",
       "124                                    NaN  \n",
       "125                                    NaN  \n",
       "126                                    NaN  \n",
       "127                                    NaN  \n",
       "128                                    NaN  \n",
       "129                                    NaN  \n",
       "130  Nest never observed with full clutch.  \n",
       "131  Nest never observed with full clutch.  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "for name, gdf in dfa.groupby('Island'):\n",
    "    display(name, gdf)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 70,
   "id": "affc142d-5411-4305-a441-0c058a7fff7c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Island\n",
       "Biscoe       168\n",
       "Dream        124\n",
       "Torgersen     52\n",
       "dtype: int64"
      ]
     },
     "execution_count": 70,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island').size()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "id": "a10d9160-8e63-4a1e-af89-2d6cfc6f9b7b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>0</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Biscoe</th>\n",
       "      <td>168</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Dream</th>\n",
       "      <td>124</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <td>52</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "             0\n",
       "Island        \n",
       "Biscoe     168\n",
       "Dream      124\n",
       "Torgersen   52"
      ]
     },
     "execution_count": 74,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island').size().to_frame()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 75,
   "id": "6693b39b-1b1f-4195-9e1f-d6756cfc1de1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Island\n",
       "Biscoe       45.257485\n",
       "Dream        44.167742\n",
       "Torgersen    38.950980\n",
       "Name: Culmen Length (mm), dtype: float64"
      ]
     },
     "execution_count": 75,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island')['Culmen Length (mm)'].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "id": "c10cebe0-c9b2-4068-a5a1-04024f521d5d",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Island</th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Biscoe</td>\n",
       "      <td>45.257485</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Dream</td>\n",
       "      <td>44.167742</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Torgersen</td>\n",
       "      <td>38.950980</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Island  Culmen Length (mm)\n",
       "0     Biscoe           45.257485\n",
       "1      Dream           44.167742\n",
       "2  Torgersen           38.950980"
      ]
     },
     "execution_count": 78,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island')['Culmen Length (mm)'].mean().to_frame().reset_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "id": "f4c1ca13-8f7f-40cb-817e-14bb3f1fcd6b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Culmen Length (mm)</th>\n",
       "      <th>Culmen Depth (mm)</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Biscoe</th>\n",
       "      <td>45.257485</td>\n",
       "      <td>15.874850</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Dream</th>\n",
       "      <td>44.167742</td>\n",
       "      <td>18.344355</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <td>38.950980</td>\n",
       "      <td>18.429412</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "           Culmen Length (mm)  Culmen Depth (mm)\n",
       "Island                                          \n",
       "Biscoe              45.257485          15.874850\n",
       "Dream               44.167742          18.344355\n",
       "Torgersen           38.950980          18.429412"
      ]
     },
     "execution_count": 79,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island')[['Culmen Length (mm)', 'Culmen Depth (mm)']].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "id": "3b395216-186c-4784-bf2f-2def8779ade3",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Length (mm)</th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Depth (mm)</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>Biscoe</th>\n",
       "      <td>34.5</td>\n",
       "      <td>59.6</td>\n",
       "      <td>13.1</td>\n",
       "      <td>21.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Dream</th>\n",
       "      <td>32.1</td>\n",
       "      <td>58.0</td>\n",
       "      <td>15.5</td>\n",
       "      <td>21.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <td>33.5</td>\n",
       "      <td>46.0</td>\n",
       "      <td>15.9</td>\n",
       "      <td>21.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          Culmen Length (mm)       Culmen Depth (mm)      \n",
       "                         min   max               min   max\n",
       "Island                                                    \n",
       "Biscoe                  34.5  59.6              13.1  21.1\n",
       "Dream                   32.1  58.0              15.5  21.2\n",
       "Torgersen               33.5  46.0              15.9  21.5"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby('Island').agg({'Culmen Length (mm)': ['min','max'], 'Culmen Depth (mm)': ['min','max']})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "id": "829cb56f-fd32-4775-80cc-4099cf96f6fe",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr:last-of-type th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Length (mm)</th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Depth (mm)</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th>Species</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Biscoe</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>34.5</td>\n",
       "      <td>45.6</td>\n",
       "      <td>16.0</td>\n",
       "      <td>21.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Gentoo penguin (Pygoscelis papua)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>59.6</td>\n",
       "      <td>13.1</td>\n",
       "      <td>17.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Dream</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>32.1</td>\n",
       "      <td>44.1</td>\n",
       "      <td>15.5</td>\n",
       "      <td>21.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Chinstrap penguin (Pygoscelis antarctica)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>58.0</td>\n",
       "      <td>16.4</td>\n",
       "      <td>20.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>33.5</td>\n",
       "      <td>46.0</td>\n",
       "      <td>15.9</td>\n",
       "      <td>21.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                    Culmen Length (mm)        \\\n",
       "                                                                   min   max   \n",
       "Island    Species                                                              \n",
       "Biscoe    Adelie Penguin (Pygoscelis adeliae)                     34.5  45.6   \n",
       "          Gentoo penguin (Pygoscelis papua)                       40.9  59.6   \n",
       "Dream     Adelie Penguin (Pygoscelis adeliae)                     32.1  44.1   \n",
       "          Chinstrap penguin (Pygoscelis antarctica)               40.9  58.0   \n",
       "Torgersen Adelie Penguin (Pygoscelis adeliae)                     33.5  46.0   \n",
       "\n",
       "                                                    Culmen Depth (mm)        \n",
       "                                                                  min   max  \n",
       "Island    Species                                                            \n",
       "Biscoe    Adelie Penguin (Pygoscelis adeliae)                    16.0  21.1  \n",
       "          Gentoo penguin (Pygoscelis papua)                      13.1  17.3  \n",
       "Dream     Adelie Penguin (Pygoscelis adeliae)                    15.5  21.2  \n",
       "          Chinstrap penguin (Pygoscelis antarctica)              16.4  20.8  \n",
       "Torgersen Adelie Penguin (Pygoscelis adeliae)                    15.9  21.5  "
      ]
     },
     "execution_count": 81,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby(['Island','Species']).agg({'Culmen Length (mm)': ['min','max'], 'Culmen Depth (mm)': ['min','max']})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "id": "9773c054-9f88-4e16-9bdb-5748ea28cad7",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead tr th {\n",
       "        text-align: left;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th>Island</th>\n",
       "      <th>Species</th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Length (mm)</th>\n",
       "      <th colspan=\"2\" halign=\"left\">Culmen Depth (mm)</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "      <th>min</th>\n",
       "      <th>max</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>34.5</td>\n",
       "      <td>45.6</td>\n",
       "      <td>16.0</td>\n",
       "      <td>21.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>Biscoe</td>\n",
       "      <td>Gentoo penguin (Pygoscelis papua)</td>\n",
       "      <td>40.9</td>\n",
       "      <td>59.6</td>\n",
       "      <td>13.1</td>\n",
       "      <td>17.3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>Dream</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>32.1</td>\n",
       "      <td>44.1</td>\n",
       "      <td>15.5</td>\n",
       "      <td>21.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>Dream</td>\n",
       "      <td>Chinstrap penguin (Pygoscelis antarctica)</td>\n",
       "      <td>40.9</td>\n",
       "      <td>58.0</td>\n",
       "      <td>16.4</td>\n",
       "      <td>20.8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>Torgersen</td>\n",
       "      <td>Adelie Penguin (Pygoscelis adeliae)</td>\n",
       "      <td>33.5</td>\n",
       "      <td>46.0</td>\n",
       "      <td>15.9</td>\n",
       "      <td>21.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Island                                    Species Culmen Length (mm)  \\\n",
       "                                                                       min   \n",
       "0     Biscoe        Adelie Penguin (Pygoscelis adeliae)               34.5   \n",
       "1     Biscoe          Gentoo penguin (Pygoscelis papua)               40.9   \n",
       "2      Dream        Adelie Penguin (Pygoscelis adeliae)               32.1   \n",
       "3      Dream  Chinstrap penguin (Pygoscelis antarctica)               40.9   \n",
       "4  Torgersen        Adelie Penguin (Pygoscelis adeliae)               33.5   \n",
       "\n",
       "        Culmen Depth (mm)        \n",
       "    max               min   max  \n",
       "0  45.6              16.0  21.1  \n",
       "1  59.6              13.1  17.3  \n",
       "2  44.1              15.5  21.2  \n",
       "3  58.0              16.4  20.8  \n",
       "4  46.0              15.9  21.5  "
      ]
     },
     "execution_count": 82,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dfa.groupby(['Island','Species']).agg({'Culmen Length (mm)': ['min','max'], 'Culmen Depth (mm)': ['min','max']}).reset_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "id": "20f72953-9a58-4bad-b97a-341021b005d8",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>Lmin</th>\n",
       "      <th>Lmax</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th>Species</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Biscoe</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>34.5</td>\n",
       "      <td>45.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Gentoo penguin (Pygoscelis papua)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>59.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Dream</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>32.1</td>\n",
       "      <td>44.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Chinstrap penguin (Pygoscelis antarctica)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>58.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>33.5</td>\n",
       "      <td>46.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                     Lmin  Lmax\n",
       "Island    Species                                              \n",
       "Biscoe    Adelie Penguin (Pygoscelis adeliae)        34.5  45.6\n",
       "          Gentoo penguin (Pygoscelis papua)          40.9  59.6\n",
       "Dream     Adelie Penguin (Pygoscelis adeliae)        32.1  44.1\n",
       "          Chinstrap penguin (Pygoscelis antarctica)  40.9  58.0\n",
       "Torgersen Adelie Penguin (Pygoscelis adeliae)        33.5  46.0"
      ]
     },
     "execution_count": 83,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Named aggregation: each keyword becomes an output column, built from (source column, function).\n",
    "# Lmax must use 'max'; with 'min' it silently duplicated the Lmin column.\n",
    "dfa.groupby(['Island','Species']).agg(\n",
    "    Lmin=('Culmen Length (mm)', 'min'),\n",
    "    Lmax=('Culmen Length (mm)', 'max'),\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "id": "ef8f4c5d-9899-4f68-8add-551edceae534",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>Culmen Length (mm) Min</th>\n",
       "      <th>Culmen Length (mm) Max</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Island</th>\n",
       "      <th>Species</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Biscoe</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>34.5</td>\n",
       "      <td>45.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Gentoo penguin (Pygoscelis papua)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>59.6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">Dream</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>32.1</td>\n",
       "      <td>44.1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Chinstrap penguin (Pygoscelis antarctica)</th>\n",
       "      <td>40.9</td>\n",
       "      <td>58.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Torgersen</th>\n",
       "      <th>Adelie Penguin (Pygoscelis adeliae)</th>\n",
       "      <td>33.5</td>\n",
       "      <td>46.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                     Culmen Length (mm) Min  \\\n",
       "Island    Species                                                             \n",
       "Biscoe    Adelie Penguin (Pygoscelis adeliae)                          34.5   \n",
       "          Gentoo penguin (Pygoscelis papua)                            40.9   \n",
       "Dream     Adelie Penguin (Pygoscelis adeliae)                          32.1   \n",
       "          Chinstrap penguin (Pygoscelis antarctica)                    40.9   \n",
       "Torgersen Adelie Penguin (Pygoscelis adeliae)                          33.5   \n",
       "\n",
       "                                                     Culmen Length (mm) Max  \n",
       "Island    Species                                                            \n",
       "Biscoe    Adelie Penguin (Pygoscelis adeliae)                          45.6  \n",
       "          Gentoo penguin (Pygoscelis papua)                            59.6  \n",
       "Dream     Adelie Penguin (Pygoscelis adeliae)                          44.1  \n",
       "          Chinstrap penguin (Pygoscelis antarctica)                    58.0  \n",
       "Torgersen Adelie Penguin (Pygoscelis adeliae)                          46.0  "
      ]
     },
     "execution_count": 84,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Named aggregation with output labels that are not valid Python identifiers:\n",
    "# pass them through a dict unpacked with **. The 'Max' column must aggregate with 'max'.\n",
    "dfa.groupby(['Island','Species']).agg(**{\n",
    "    \"Culmen Length (mm) Min\": ('Culmen Length (mm)', 'min'),\n",
    "    \"Culmen Length (mm) Max\": ('Culmen Length (mm)', 'max'),\n",
    "})"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "4c638be9-7d10-47f3-a48b-33f64d0ab0f0",
   "metadata": {},
   "source": [
    "### Melt/Unpivot and Pivot"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ea38a33a-5440-4303-9ea3-df8d733a815c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# weather.txt data from https://code.webartifex.biz/alexander/tidy-data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "id": "863a5d1d-eb03-4168-a29f-28dae4da7074",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "MX000017004195504TMAX  310  I  310  I  310  I  320  I  330  I  320  I  320  I  330  I  330  I  330  I  330  I  320  I  310  I  310  I  320  I  320  I  320  I  310  I  310  I  320  I  320  I  330  I  330  I  330  I  330  I  330  I  330  I  340  I  330  I  320  I-9999   \n",
      "MX000017004195504TMIN  150  I  150  I  160  I  150  I  160  I  160  I  160  I  160  I  160  I  170  I  170  I  160  I  160  I  160  I  170  I  170  I  160  I  160  I  160  I  160  I  170  I  170  I  170  I  170  I  180  I  190  I  190  I  170  I  180  I  160  I-9999   \n",
      "MX000017004195504PRCP    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    6  I-9999   \n",
      "MX000017004195505TMAX  310  I  310  I  310  I  300  I  300  I  300  I  310  I  310  I  310  I  300  I  300  I  310  I  300  I  310  I  320  I  320  I  330  I  330  I  330  I  300  I  350  I  330  I  340  I  350  I  330  I  310  I  310  I  320  I  310  I  300  I  290  I\n",
      "MX000017004195505TMIN  200  I  160  I  160  I  150  I  150  I  150  I  160  I  160  I  170  I  170  I  170  I  170  I  160  I  170  I  170  I  180  I  190  I  180  I  180  I  180  I  200  I  170  I  190  I  190  I  190  I  180  I  160  I  150  I  170  I  150  I  160  I\n",
      "MX000017004195505PRCP    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I   12  I   24  I    0  I    0  I    0  I    0  I    0  I    0  I    0  I    5  I    0  I    0  I    0  I    0  I    0  I  142  I    0  I   54  I    0  I   46  I\n",
      "MX000017004195506TMAX  300  I  290  I  280  I  270  I  280  I  260  I  230  I  270  I  280  I  280  I  270  I  290  I  290  I  270  I  290  I  290  I  290  I  300  I  300  I  300  I  300  I  290  I  270  I  270  I  270  I  280  I  300  I  270  I  290  I  270  I-9999   \n",
      "MX000017004195506TMIN  160  I  160  I  150  I  140  I  160  I  150  I  150  I  150  I  160  I  150  I  160  I  180  I  170  I  140  I  160  I  150  I  160  I  170  I  160  I  170  I  170  I  160  I  170  I  150  I  160  I  160  I  160  I  180  I  150  I  150  I-9999   \n",
      "MX000017004195506PRCP  103  I  435  I  422  I    0  I  243  I   17  I    0  I    0  I    0  I   27  I    0  I   15  I  292  I    0  I   28  I   76  I    0  I    0  I    0  I    0  I    0  I    0  I   44  I   52  I    3  I   13  I    0  I   37  I  165  I  323  I-9999   \n",
      "MX000017004195507TMAX  270  I  270  I  260  I  260  I  240  I  240  I  190  I  210  I  250  I  250  I  260  I  240  I  250  I  250  I  270  I  240  I  230  I  240  I  230  I  240  I  240  I  230  I  240  I  240  I  260  I  260  I  260  I  260  I  260  I  260  I  260  I\n"
     ]
    }
   ],
   "source": [
    "!head -10 weather.txt"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "id": "08b8a567-addb-41ce-ac0a-795e39f1d572",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (1_714, 128)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>id</th><th>year</th><th>month</th><th>element</th><th>value1</th><th>mflag1</th><th>qflag1</th><th>sflag1</th><th>value2</th><th>mflag2</th><th>qflag2</th><th>sflag2</th><th>value3</th><th>mflag3</th><th>qflag3</th><th>sflag3</th><th>value4</th><th>mflag4</th><th>qflag4</th><th>sflag4</th><th>value5</th><th>mflag5</th><th>qflag5</th><th>sflag5</th><th>value6</th><th>mflag6</th><th>qflag6</th><th>sflag6</th><th>value7</th><th>mflag7</th><th>qflag7</th><th>sflag7</th><th>value8</th><th>mflag8</th><th>qflag8</th><th>sflag8</th><th>value9</th><th>&hellip;</th><th>sflag22</th><th>value23</th><th>mflag23</th><th>qflag23</th><th>sflag23</th><th>value24</th><th>mflag24</th><th>qflag24</th><th>sflag24</th><th>value25</th><th>mflag25</th><th>qflag25</th><th>sflag25</th><th>value26</th><th>mflag26</th><th>qflag26</th><th>sflag26</th><th>value27</th><th>mflag27</th><th>qflag27</th><th>sflag27</th><th>value28</th><th>mflag28</th><th>qflag28</th><th>sflag28</th><th>value29</th><th>mflag29</th><th>qflag29</th><th>sflag29</th><th>value30</th><th>mflag30</th><th>qflag30</th><th>sflag30</th><th>value31</th><th>mflag31</th><th>qflag31</th><th>sflag31</th></tr><tr><td>str</td><td>i32</td><td>i32</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>&hellip;</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td
>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td><td>i32</td><td>str</td><td>str</td><td>str</td></tr></thead><tbody><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmax&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>320</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>320</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>320</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&hellip;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>340</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>320</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmin&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&hellip;</td><td>&quot;I&quot;</td><td>170</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>170</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>180</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>190</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>190</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>170</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>180</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;prcp&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&hellip;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; 
&quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>6</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;tmax&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>300</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>300</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>300</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&hellip;</td><td>&quot;I&quot;</td><td>340</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>350</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>330</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>320</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>310</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>300</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>290</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;tmin&quot;</td><td>200</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>170</td><td>&hellip;</td><td>&quot;I&quot;</td><td>190</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>190</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>190</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>180</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>170</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>150</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;I&quot;</td><td>160</td><td>&quot; &quot;</td><td>&quot; 
&quot;</td><td>&quot;I&quot;</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;tmin&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>148</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&hellip;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>162</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>170</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;prcp&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&hellip;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmax&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>350</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&hellip;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmin&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>168</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&hellip;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;prcp&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>0</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot;S&quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; 
&quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&hellip;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>-9999</td><td>&quot; &quot;</td><td>&quot; &quot;</td><td>&quot; &quot;</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (1_714, 128)\n",
       "┌─────────────┬──────┬───────┬─────────┬───┬─────────┬─────────┬─────────┬─────────┐\n",
       "│ id          ┆ year ┆ month ┆ element ┆ … ┆ value31 ┆ mflag31 ┆ qflag31 ┆ sflag31 │\n",
       "│ ---         ┆ ---  ┆ ---   ┆ ---     ┆   ┆ ---     ┆ ---     ┆ ---     ┆ ---     │\n",
       "│ str         ┆ i32  ┆ i32   ┆ str     ┆   ┆ i32     ┆ str     ┆ str     ┆ str     │\n",
       "╞═════════════╪══════╪═══════╪═════════╪═══╪═════════╪═════════╪═════════╪═════════╡\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmax    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmin    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ prcp    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmax    ┆ … ┆ 290     ┆         ┆         ┆ I       │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmin    ┆ … ┆ 160     ┆         ┆         ┆ I       │\n",
       "│ …           ┆ …    ┆ …     ┆ …       ┆ … ┆ …       ┆ …       ┆ …       ┆ …       │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ tmin    ┆ … ┆ 170     ┆         ┆         ┆ S       │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ prcp    ┆ … ┆ 0       ┆         ┆         ┆ S       │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmax    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmin    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ prcp    ┆ … ┆ -9999   ┆         ┆         ┆         │\n",
       "└─────────────┴──────┴───────┴─────────┴───┴─────────┴─────────┴─────────┴─────────┘"
      ]
     },
     "execution_count": 87,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# ghcn file format detailed here:\n",
    "# https://www1.ncdc.noaa.gov/pub/data/ghcn/daily/readme.txt\n",
    "\n",
    "# ------------------------------\n",
    "# Variable   Columns   Type\n",
    "# ------------------------------\n",
    "# ID            1-11   Character\n",
    "# YEAR         12-15   Integer\n",
    "# MONTH        16-17   Integer\n",
    "# ELEMENT      18-21   Character\n",
    "# VALUE1       22-26   Integer\n",
    "# MFLAG1       27-27   Character\n",
    "# QFLAG1       28-28   Character\n",
    "# SFLAG1       29-29   Character\n",
    "# VALUE2       30-34   Integer\n",
    "# MFLAG2       35-35   Character\n",
    "# QFLAG2       36-36   Character\n",
    "# SFLAG2       37-37   Character\n",
    "#   .           .          .\n",
    "#   .           .          .\n",
    "#   .           .          .\n",
    "# VALUE31    262-266   Integer\n",
    "# MFLAG31    267-267   Character\n",
    "# QFLAG31    268-268   Character\n",
    "# SFLAG31    269-269   Character\n",
    "# ------------------------------\n",
    "\n",
    "# parsing using extract_groups\n",
    "# h/t https://stackoverflow.com/a/78545671\n",
    "\n",
    "import polars as pl\n",
    "\n",
    "# Read file as a single-column DataFrame\n",
    "wdf = pl.read_csv(\n",
    "    \"weather.txt\",\n",
    "    separator=\"\\n\",\n",
    "    has_header=False,\n",
    "    new_columns=[\"data\"],\n",
    ")\n",
    "\n",
    "# Extract columns with regex\n",
    "days = \"\".join([f\"(?<value{d}>.{{5}})(?<mflag{d}>.{{1}})(?<qflag{d}>.{{1}})(?<sflag{d}>.{{1}})\" for d in range(1,32)])\n",
    "wdf = wdf.select(\n",
    "    pl.col(\"data\").str.extract_groups(\n",
    "        r\"^(?<id>.{11})(?<year>.{4})(?<month>.{2})(?<element>.{4})\" + days + \"$\"\n",
    "    )\n",
    ").unnest(\"data\")\n",
    "\n",
    "wdf = wdf.with_columns(pl.col(\"year\",\"month\",r\"^value\\d*$\").str.strip_chars().cast(pl.Int32),\n",
    "                      pl.col('element').str.to_lowercase())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 88,
   "id": "f9aeae1a-f589-40b5-b6bf-fffd7f89a974",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (1_129, 35)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>id</th><th>year</th><th>month</th><th>element</th><th>d1</th><th>d2</th><th>d3</th><th>d4</th><th>d5</th><th>d6</th><th>d7</th><th>d8</th><th>d9</th><th>d10</th><th>d11</th><th>d12</th><th>d13</th><th>d14</th><th>d15</th><th>d16</th><th>d17</th><th>d18</th><th>d19</th><th>d20</th><th>d21</th><th>d22</th><th>d23</th><th>d24</th><th>d25</th><th>d26</th><th>d27</th><th>d28</th><th>d29</th><th>d30</th><th>d31</th></tr><tr><td>str</td><td>i32</td><td>i32</td><td>str</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmax&quot;</td><td>31.0</td><td>31.0</td><td>31.0</td><td>32.0</td><td>33.0</td><td>32.0</td><td>32.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>32.0</td><td>31.0</td><td>31.0</td><td>32.0</td><td>32.0</td><td>32.0</td><td>31.0</td><td>31.0</td><td>32.0</td><td>32.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>34.0</td><td>33.0</td><td>32.0</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmin&quot;</td><td>15.0</td><td>15.0</td><td>16.0</td><td>15.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>17.0</td><td>17.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>17.0</td><td>17.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>16.0</td><td>17.0</td><td>17.0</td><td>17.0</td><td>17.0</td><td>18.0</td><td>19.0</td><td>19.0</td><td>17.0</td><td>18.0</td><td>16.0</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><
td>&quot;tmax&quot;</td><td>31.0</td><td>31.0</td><td>31.0</td><td>30.0</td><td>30.0</td><td>30.0</td><td>31.0</td><td>31.0</td><td>31.0</td><td>30.0</td><td>30.0</td><td>31.0</td><td>30.0</td><td>31.0</td><td>32.0</td><td>32.0</td><td>33.0</td><td>33.0</td><td>33.0</td><td>30.0</td><td>35.0</td><td>33.0</td><td>34.0</td><td>35.0</td><td>33.0</td><td>31.0</td><td>31.0</td><td>32.0</td><td>31.0</td><td>30.0</td><td>29.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;tmin&quot;</td><td>20.0</td><td>16.0</td><td>16.0</td><td>15.0</td><td>15.0</td><td>15.0</td><td>16.0</td><td>16.0</td><td>17.0</td><td>17.0</td><td>17.0</td><td>17.0</td><td>16.0</td><td>17.0</td><td>17.0</td><td>18.0</td><td>19.0</td><td>18.0</td><td>18.0</td><td>18.0</td><td>20.0</td><td>17.0</td><td>19.0</td><td>19.0</td><td>19.0</td><td>18.0</td><td>16.0</td><td>15.0</td><td>17.0</td><td>15.0</td><td>16.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>6</td><td>&quot;tmax&quot;</td><td>30.0</td><td>29.0</td><td>28.0</td><td>27.0</td><td>28.0</td><td>26.0</td><td>23.0</td><td>27.0</td><td>28.0</td><td>28.0</td><td>27.0</td><td>29.0</td><td>29.0</td><td>27.0</td><td>29.0</td><td>29.0</td><td>29.0</td><td>30.0</td><td>30.0</td><td>30.0</td><td>30.0</td><td>29.0</td><td>27.0</td><td>27.0</td><td>27.0</td><td>28.0</td><td>30.0</td><td>27.0</td><td>29.0</td><td>27.0</td><td>NaN</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td
>&hellip;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>2</td><td>&quot;tmin&quot;</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>13.6</td><td>NaN</td><td>13.4</td><td>NaN</td><td>12.8</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;tmax&quot;</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>33.2</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>32.0</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>33.2</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>36.5</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;tmin&quot;</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>14.8</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>12.7</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>16.2</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>17.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmax&quot;</td><td>NaN</td><td>35.0</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmin&quot;</td><td>NaN</td><td>16.8</td><td>NaN</td><td>
NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td><td>NaN</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (1_129, 35)\n",
       "┌─────────────┬──────┬───────┬─────────┬───┬──────┬──────┬──────┬──────┐\n",
       "│ id          ┆ year ┆ month ┆ element ┆ … ┆ d28  ┆ d29  ┆ d30  ┆ d31  │\n",
       "│ ---         ┆ ---  ┆ ---   ┆ ---     ┆   ┆ ---  ┆ ---  ┆ ---  ┆ ---  │\n",
       "│ str         ┆ i32  ┆ i32   ┆ str     ┆   ┆ f64  ┆ f64  ┆ f64  ┆ f64  │\n",
       "╞═════════════╪══════╪═══════╪═════════╪═══╪══════╪══════╪══════╪══════╡\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmax    ┆ … ┆ 34.0 ┆ 33.0 ┆ 32.0 ┆ NaN  │\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmin    ┆ … ┆ 17.0 ┆ 18.0 ┆ 16.0 ┆ NaN  │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmax    ┆ … ┆ 32.0 ┆ 31.0 ┆ 30.0 ┆ 29.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmin    ┆ … ┆ 15.0 ┆ 17.0 ┆ 15.0 ┆ 16.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 6     ┆ tmax    ┆ … ┆ 27.0 ┆ 29.0 ┆ 27.0 ┆ NaN  │\n",
       "│ …           ┆ …    ┆ …     ┆ …       ┆ … ┆ …    ┆ …    ┆ …    ┆ …    │\n",
       "│ MX000017004 ┆ 2011 ┆ 2     ┆ tmin    ┆ … ┆ NaN  ┆ NaN  ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ tmax    ┆ … ┆ NaN  ┆ NaN  ┆ NaN  ┆ 36.5 │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ tmin    ┆ … ┆ NaN  ┆ NaN  ┆ NaN  ┆ 17.0 │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmax    ┆ … ┆ NaN  ┆ NaN  ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmin    ┆ … ┆ NaN  ┆ NaN  ┆ NaN  ┆ NaN  │\n",
       "└─────────────┴──────┴───────┴─────────┴───┴──────┴──────┴──────┴──────┘"
      ]
     },
     "execution_count": 88,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import math\n",
    "wdf = (wdf.filter(pl.col(\"element\").str.to_lowercase().is_in([\"tmax\",\"tmin\"]))\n",
    "          .with_columns(pl.col(r\"^value\\d*$\").cast(pl.Float64).replace(-9999,math.nan) / 10)\n",
    "          .select(pl.col(\"id\",\"year\",\"month\",\"element\",r\"^value.*$\"))\n",
    ").rename(lambda c: f\"d{c[5:]}\" if c.startswith('value') else c)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 89,
   "id": "1a570516-dd13-40dd-a6ce-79eda2863a7a",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (34_999, 6)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>id</th><th>year</th><th>month</th><th>element</th><th>variable</th><th>value</th></tr><tr><td>str</td><td>i32</td><td>i32</td><td>str</td><td>str</td><td>f64</td></tr></thead><tbody><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmax&quot;</td><td>&quot;d1&quot;</td><td>31.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;tmin&quot;</td><td>&quot;d1&quot;</td><td>15.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;tmax&quot;</td><td>&quot;d1&quot;</td><td>31.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;tmin&quot;</td><td>&quot;d1&quot;</td><td>20.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>6</td><td>&quot;tmax&quot;</td><td>&quot;d1&quot;</td><td>30.0</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>2</td><td>&quot;tmin&quot;</td><td>&quot;d31&quot;</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;tmax&quot;</td><td>&quot;d31&quot;</td><td>36.5</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;tmin&quot;</td><td>&quot;d31&quot;</td><td>17.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmax&quot;</td><td>&quot;d31&quot;</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;tmin&quot;</td><td>&quot;d31&quot;</td><td>NaN</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (34_999, 6)\n",
       "┌─────────────┬──────┬───────┬─────────┬──────────┬───────┐\n",
       "│ id          ┆ year ┆ month ┆ element ┆ variable ┆ value │\n",
       "│ ---         ┆ ---  ┆ ---   ┆ ---     ┆ ---      ┆ ---   │\n",
       "│ str         ┆ i32  ┆ i32   ┆ str     ┆ str      ┆ f64   │\n",
       "╞═════════════╪══════╪═══════╪═════════╪══════════╪═══════╡\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmax    ┆ d1       ┆ 31.0  │\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ tmin    ┆ d1       ┆ 15.0  │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmax    ┆ d1       ┆ 31.0  │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ tmin    ┆ d1       ┆ 20.0  │\n",
       "│ MX000017004 ┆ 1955 ┆ 6     ┆ tmax    ┆ d1       ┆ 30.0  │\n",
       "│ …           ┆ …    ┆ …     ┆ …       ┆ …        ┆ …     │\n",
       "│ MX000017004 ┆ 2011 ┆ 2     ┆ tmin    ┆ d31      ┆ NaN   │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ tmax    ┆ d31      ┆ 36.5  │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ tmin    ┆ d31      ┆ 17.0  │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmax    ┆ d31      ┆ NaN   │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ tmin    ┆ d31      ┆ NaN   │\n",
       "└─────────────┴──────┴───────┴─────────┴──────────┴───────┘"
      ]
     },
     "execution_count": 89,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdf_up = wdf.unpivot(index=['id','year','month','element'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 90,
   "id": "37b2807a-d61d-4b6c-9137-9ad42ba9f89e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (17_515, 6)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>id</th><th>year</th><th>month</th><th>variable</th><th>tmax</th><th>tmin</th></tr><tr><td>str</td><td>i32</td><td>i32</td><td>str</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>4</td><td>&quot;d1&quot;</td><td>31.0</td><td>15.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>5</td><td>&quot;d1&quot;</td><td>31.0</td><td>20.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>6</td><td>&quot;d1&quot;</td><td>30.0</td><td>16.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>7</td><td>&quot;d1&quot;</td><td>27.0</td><td>15.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955</td><td>8</td><td>&quot;d1&quot;</td><td>23.0</td><td>14.0</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2010</td><td>12</td><td>&quot;d31&quot;</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>1</td><td>&quot;d31&quot;</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>2</td><td>&quot;d31&quot;</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>3</td><td>&quot;d31&quot;</td><td>36.5</td><td>17.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011</td><td>4</td><td>&quot;d31&quot;</td><td>NaN</td><td>NaN</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (17_515, 6)\n",
       "┌─────────────┬──────┬───────┬──────────┬──────┬──────┐\n",
       "│ id          ┆ year ┆ month ┆ variable ┆ tmax ┆ tmin │\n",
       "│ ---         ┆ ---  ┆ ---   ┆ ---      ┆ ---  ┆ ---  │\n",
       "│ str         ┆ i32  ┆ i32   ┆ str      ┆ f64  ┆ f64  │\n",
       "╞═════════════╪══════╪═══════╪══════════╪══════╪══════╡\n",
       "│ MX000017004 ┆ 1955 ┆ 4     ┆ d1       ┆ 31.0 ┆ 15.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 5     ┆ d1       ┆ 31.0 ┆ 20.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 6     ┆ d1       ┆ 30.0 ┆ 16.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 7     ┆ d1       ┆ 27.0 ┆ 15.0 │\n",
       "│ MX000017004 ┆ 1955 ┆ 8     ┆ d1       ┆ 23.0 ┆ 14.0 │\n",
       "│ …           ┆ …    ┆ …     ┆ …        ┆ …    ┆ …    │\n",
       "│ MX000017004 ┆ 2010 ┆ 12    ┆ d31      ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011 ┆ 1     ┆ d31      ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011 ┆ 2     ┆ d31      ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011 ┆ 3     ┆ d31      ┆ 36.5 ┆ 17.0 │\n",
       "│ MX000017004 ┆ 2011 ┆ 4     ┆ d31      ┆ NaN  ┆ NaN  │\n",
       "└─────────────┴──────┴───────┴──────────┴──────┴──────┘"
      ]
     },
     "execution_count": 90,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdf_p = wdf_up.pivot('element', index=['id','year','month','variable'], values='value')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "id": "344ebe1d-d19a-4b7b-9571-7baf5bd82823",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (17_204, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>id</th><th>date</th><th>tmin</th><th>tmax</th></tr><tr><td>str</td><td>date</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>&quot;MX000017004&quot;</td><td>1955-04-01</td><td>15.0</td><td>31.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955-04-02</td><td>15.0</td><td>31.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955-04-03</td><td>16.0</td><td>31.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955-04-04</td><td>15.0</td><td>32.0</td></tr><tr><td>&quot;MX000017004&quot;</td><td>1955-04-05</td><td>16.0</td><td>33.0</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011-04-26</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011-04-27</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011-04-28</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011-04-29</td><td>NaN</td><td>NaN</td></tr><tr><td>&quot;MX000017004&quot;</td><td>2011-04-30</td><td>NaN</td><td>NaN</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (17_204, 4)\n",
       "┌─────────────┬────────────┬──────┬──────┐\n",
       "│ id          ┆ date       ┆ tmin ┆ tmax │\n",
       "│ ---         ┆ ---        ┆ ---  ┆ ---  │\n",
       "│ str         ┆ date       ┆ f64  ┆ f64  │\n",
       "╞═════════════╪════════════╪══════╪══════╡\n",
       "│ MX000017004 ┆ 1955-04-01 ┆ 15.0 ┆ 31.0 │\n",
       "│ MX000017004 ┆ 1955-04-02 ┆ 15.0 ┆ 31.0 │\n",
       "│ MX000017004 ┆ 1955-04-03 ┆ 16.0 ┆ 31.0 │\n",
       "│ MX000017004 ┆ 1955-04-04 ┆ 15.0 ┆ 32.0 │\n",
       "│ MX000017004 ┆ 1955-04-05 ┆ 16.0 ┆ 33.0 │\n",
       "│ …           ┆ …          ┆ …    ┆ …    │\n",
       "│ MX000017004 ┆ 2011-04-26 ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011-04-27 ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011-04-28 ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011-04-29 ┆ NaN  ┆ NaN  │\n",
       "│ MX000017004 ┆ 2011-04-30 ┆ NaN  ┆ NaN  │\n",
       "└─────────────┴────────────┴──────┴──────┘"
      ]
     },
     "execution_count": 91,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdf_out = (wdf_p.with_columns(pl.concat_str([pl.col('year'),pl.col('month'),pl.col('variable').str.slice(1)], separator='-').str.to_date(strict=False).alias('date'))\n",
    "      .filter(pl.col('date').is_not_null())\n",
    "      .select('id','date','tmin','tmax')\n",
    ").sort('date')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "id": "4c47ab54-c045-4646-aed9-fd4d445703a8",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><style>\n",
       ".dataframe > thead > tr,\n",
       ".dataframe > tbody > tr {\n",
       "  text-align: right;\n",
       "  white-space: pre-wrap;\n",
       "}\n",
       "</style>\n",
       "<small>shape: (56, 3)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>date</th><th>tmin</th><th>tmax</th></tr><tr><td>i32</td><td>f64</td><td>f64</td></tr></thead><tbody><tr><td>1955</td><td>14.461818</td><td>26.647273</td></tr><tr><td>1956</td><td>13.764881</td><td>26.526786</td></tr><tr><td>1957</td><td>14.883582</td><td>27.913433</td></tr><tr><td>1958</td><td>14.69589</td><td>26.723288</td></tr><tr><td>1959</td><td>15.109589</td><td>26.80274</td></tr><tr><td>&hellip;</td><td>&hellip;</td><td>&hellip;</td></tr><tr><td>2007</td><td>14.207547</td><td>31.026415</td></tr><tr><td>2008</td><td>14.466667</td><td>31.59697</td></tr><tr><td>2009</td><td>13.373913</td><td>29.113043</td></tr><tr><td>2010</td><td>14.651515</td><td>29.190909</td></tr><tr><td>2011</td><td>14.17</td><td>32.1</td></tr></tbody></table></div>"
      ],
      "text/plain": [
       "shape: (56, 3)\n",
       "┌──────┬───────────┬───────────┐\n",
       "│ date ┆ tmin      ┆ tmax      │\n",
       "│ ---  ┆ ---       ┆ ---       │\n",
       "│ i32  ┆ f64       ┆ f64       │\n",
       "╞══════╪═══════════╪═══════════╡\n",
       "│ 1955 ┆ 14.461818 ┆ 26.647273 │\n",
       "│ 1956 ┆ 13.764881 ┆ 26.526786 │\n",
       "│ 1957 ┆ 14.883582 ┆ 27.913433 │\n",
       "│ 1958 ┆ 14.69589  ┆ 26.723288 │\n",
       "│ 1959 ┆ 15.109589 ┆ 26.80274  │\n",
       "│ …    ┆ …         ┆ …         │\n",
       "│ 2007 ┆ 14.207547 ┆ 31.026415 │\n",
       "│ 2008 ┆ 14.466667 ┆ 31.59697  │\n",
       "│ 2009 ┆ 13.373913 ┆ 29.113043 │\n",
       "│ 2010 ┆ 14.651515 ┆ 29.190909 │\n",
       "│ 2011 ┆ 14.17     ┆ 32.1      │\n",
       "└──────┴───────────┴───────────┘"
      ]
     },
     "execution_count": 92,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdf_out.group_by(pl.col('date').dt.year()).agg(pl.col('tmin','tmax').drop_nans().mean()).sort('date')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "id": "3f3128f7-ddc5-431a-9d9f-a499ceff7b1e",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>id</th>\n",
       "      <th>year</th>\n",
       "      <th>month</th>\n",
       "      <th>element</th>\n",
       "      <th>d1</th>\n",
       "      <th>d2</th>\n",
       "      <th>d3</th>\n",
       "      <th>d4</th>\n",
       "      <th>d5</th>\n",
       "      <th>d6</th>\n",
       "      <th>...</th>\n",
       "      <th>d22</th>\n",
       "      <th>d23</th>\n",
       "      <th>d24</th>\n",
       "      <th>d25</th>\n",
       "      <th>d26</th>\n",
       "      <th>d27</th>\n",
       "      <th>d28</th>\n",
       "      <th>d29</th>\n",
       "      <th>d30</th>\n",
       "      <th>d31</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>tmax</td>\n",
       "      <td>31.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>...</td>\n",
       "      <td>33.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>34.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>tmin</td>\n",
       "      <td>15.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>...</td>\n",
       "      <td>17.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>18.0</td>\n",
       "      <td>19.0</td>\n",
       "      <td>19.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>18.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>5</td>\n",
       "      <td>tmax</td>\n",
       "      <td>31.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>30.0</td>\n",
       "      <td>30.0</td>\n",
       "      <td>30.0</td>\n",
       "      <td>...</td>\n",
       "      <td>33.0</td>\n",
       "      <td>34.0</td>\n",
       "      <td>35.0</td>\n",
       "      <td>33.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>32.0</td>\n",
       "      <td>31.0</td>\n",
       "      <td>30.0</td>\n",
       "      <td>29.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>5</td>\n",
       "      <td>tmin</td>\n",
       "      <td>20.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>...</td>\n",
       "      <td>17.0</td>\n",
       "      <td>19.0</td>\n",
       "      <td>19.0</td>\n",
       "      <td>19.0</td>\n",
       "      <td>18.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>16.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>6</td>\n",
       "      <td>tmax</td>\n",
       "      <td>30.0</td>\n",
       "      <td>29.0</td>\n",
       "      <td>28.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>28.0</td>\n",
       "      <td>26.0</td>\n",
       "      <td>...</td>\n",
       "      <td>29.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>28.0</td>\n",
       "      <td>30.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>29.0</td>\n",
       "      <td>27.0</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1124</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>2</td>\n",
       "      <td>tmin</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1125</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>3</td>\n",
       "      <td>tmax</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>36.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1126</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>3</td>\n",
       "      <td>tmin</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>14.8</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>16.2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>17.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1127</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>tmax</td>\n",
       "      <td>NaN</td>\n",
       "      <td>35.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1128</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>tmin</td>\n",
       "      <td>NaN</td>\n",
       "      <td>16.8</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1129 rows × 35 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "               id  year  month element    d1    d2    d3    d4    d5    d6  \\\n",
       "0     MX000017004  1955      4    tmax  31.0  31.0  31.0  32.0  33.0  32.0   \n",
       "1     MX000017004  1955      4    tmin  15.0  15.0  16.0  15.0  16.0  16.0   \n",
       "2     MX000017004  1955      5    tmax  31.0  31.0  31.0  30.0  30.0  30.0   \n",
       "3     MX000017004  1955      5    tmin  20.0  16.0  16.0  15.0  15.0  15.0   \n",
       "4     MX000017004  1955      6    tmax  30.0  29.0  28.0  27.0  28.0  26.0   \n",
       "...           ...   ...    ...     ...   ...   ...   ...   ...   ...   ...   \n",
       "1124  MX000017004  2011      2    tmin   NaN   NaN   NaN   NaN   NaN   NaN   \n",
       "1125  MX000017004  2011      3    tmax   NaN   NaN   NaN   NaN  33.2   NaN   \n",
       "1126  MX000017004  2011      3    tmin   NaN   NaN   NaN   NaN  14.8   NaN   \n",
       "1127  MX000017004  2011      4    tmax   NaN  35.0   NaN   NaN   NaN   NaN   \n",
       "1128  MX000017004  2011      4    tmin   NaN  16.8   NaN   NaN   NaN   NaN   \n",
       "\n",
       "      ...   d22   d23   d24   d25   d26   d27   d28   d29   d30   d31  \n",
       "0     ...  33.0  33.0  33.0  33.0  33.0  33.0  34.0  33.0  32.0   NaN  \n",
       "1     ...  17.0  17.0  17.0  18.0  19.0  19.0  17.0  18.0  16.0   NaN  \n",
       "2     ...  33.0  34.0  35.0  33.0  31.0  31.0  32.0  31.0  30.0  29.0  \n",
       "3     ...  17.0  19.0  19.0  19.0  18.0  16.0  15.0  17.0  15.0  16.0  \n",
       "4     ...  29.0  27.0  27.0  27.0  28.0  30.0  27.0  29.0  27.0   NaN  \n",
       "...   ...   ...   ...   ...   ...   ...   ...   ...   ...   ...   ...  \n",
       "1124  ...   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN  \n",
       "1125  ...   NaN   NaN   NaN   NaN  33.2   NaN   NaN   NaN   NaN  36.5  \n",
       "1126  ...   NaN   NaN   NaN   NaN  16.2   NaN   NaN   NaN   NaN  17.0  \n",
       "1127  ...   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN  \n",
       "1128  ...   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN   NaN  \n",
       "\n",
       "[1129 rows x 35 columns]"
      ]
     },
     "execution_count": 93,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pandas as pd\n",
    "wdfa = wdf.to_pandas()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "id": "4ccd6ba8-65b3-486a-a976-cfb397853386",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>id</th>\n",
       "      <th>year</th>\n",
       "      <th>month</th>\n",
       "      <th>element</th>\n",
       "      <th>variable</th>\n",
       "      <th>value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>tmax</td>\n",
       "      <td>d1</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>tmin</td>\n",
       "      <td>d1</td>\n",
       "      <td>15.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>5</td>\n",
       "      <td>tmax</td>\n",
       "      <td>d1</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>5</td>\n",
       "      <td>tmin</td>\n",
       "      <td>d1</td>\n",
       "      <td>20.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>6</td>\n",
       "      <td>tmax</td>\n",
       "      <td>d1</td>\n",
       "      <td>30.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34994</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>2</td>\n",
       "      <td>tmin</td>\n",
       "      <td>d31</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34995</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>3</td>\n",
       "      <td>tmax</td>\n",
       "      <td>d31</td>\n",
       "      <td>36.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34996</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>3</td>\n",
       "      <td>tmin</td>\n",
       "      <td>d31</td>\n",
       "      <td>17.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34997</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>tmax</td>\n",
       "      <td>d31</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34998</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>tmin</td>\n",
       "      <td>d31</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>34999 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                id  year  month element variable  value\n",
       "0      MX000017004  1955      4    tmax       d1   31.0\n",
       "1      MX000017004  1955      4    tmin       d1   15.0\n",
       "2      MX000017004  1955      5    tmax       d1   31.0\n",
       "3      MX000017004  1955      5    tmin       d1   20.0\n",
       "4      MX000017004  1955      6    tmax       d1   30.0\n",
       "...            ...   ...    ...     ...      ...    ...\n",
       "34994  MX000017004  2011      2    tmin      d31    NaN\n",
       "34995  MX000017004  2011      3    tmax      d31   36.5\n",
       "34996  MX000017004  2011      3    tmin      d31   17.0\n",
       "34997  MX000017004  2011      4    tmax      d31    NaN\n",
       "34998  MX000017004  2011      4    tmin      d31    NaN\n",
       "\n",
       "[34999 rows x 6 columns]"
      ]
     },
     "execution_count": 94,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdfa_melt = wdfa.melt(id_vars=['id','year','month','element'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "id": "6fd663f0-026f-48c3-8602-6d16b77ef5cc",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th>element</th>\n",
       "      <th>id</th>\n",
       "      <th>year</th>\n",
       "      <th>month</th>\n",
       "      <th>variable</th>\n",
       "      <th>tmax</th>\n",
       "      <th>tmin</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d1</td>\n",
       "      <td>31.0</td>\n",
       "      <td>15.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d10</td>\n",
       "      <td>33.0</td>\n",
       "      <td>17.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d11</td>\n",
       "      <td>33.0</td>\n",
       "      <td>17.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d12</td>\n",
       "      <td>32.0</td>\n",
       "      <td>16.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d13</td>\n",
       "      <td>31.0</td>\n",
       "      <td>16.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17510</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d5</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17511</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d6</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17512</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d7</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17513</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d8</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17514</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d9</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>17515 rows × 6 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "element           id  year  month variable  tmax  tmin\n",
       "0        MX000017004  1955      4       d1  31.0  15.0\n",
       "1        MX000017004  1955      4      d10  33.0  17.0\n",
       "2        MX000017004  1955      4      d11  33.0  17.0\n",
       "3        MX000017004  1955      4      d12  32.0  16.0\n",
       "4        MX000017004  1955      4      d13  31.0  16.0\n",
       "...              ...   ...    ...      ...   ...   ...\n",
       "17510    MX000017004  2011      4       d5   NaN   NaN\n",
       "17511    MX000017004  2011      4       d6   NaN   NaN\n",
       "17512    MX000017004  2011      4       d7   NaN   NaN\n",
       "17513    MX000017004  2011      4       d8   NaN   NaN\n",
       "17514    MX000017004  2011      4       d9   NaN   NaN\n",
       "\n",
       "[17515 rows x 6 columns]"
      ]
     },
     "execution_count": 97,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdfa_pivot = wdfa_melt.pivot(columns='element',index=['id','year','month','variable'],values='value').reset_index()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "id": "324e1790-273d-4db9-b1bc-75f3245347da",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th>element</th>\n",
       "      <th>id</th>\n",
       "      <th>year</th>\n",
       "      <th>month</th>\n",
       "      <th>variable</th>\n",
       "      <th>tmax</th>\n",
       "      <th>tmin</th>\n",
       "      <th>day</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d1</td>\n",
       "      <td>31.0</td>\n",
       "      <td>15.0</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d10</td>\n",
       "      <td>33.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d11</td>\n",
       "      <td>33.0</td>\n",
       "      <td>17.0</td>\n",
       "      <td>11</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d12</td>\n",
       "      <td>32.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>12</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955</td>\n",
       "      <td>4</td>\n",
       "      <td>d13</td>\n",
       "      <td>31.0</td>\n",
       "      <td>16.0</td>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17510</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d5</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17511</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d6</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17512</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d7</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17513</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d8</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17514</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011</td>\n",
       "      <td>4</td>\n",
       "      <td>d9</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>17515 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "element           id  year  month variable  tmax  tmin  day\n",
       "0        MX000017004  1955      4       d1  31.0  15.0    1\n",
       "1        MX000017004  1955      4      d10  33.0  17.0   10\n",
       "2        MX000017004  1955      4      d11  33.0  17.0   11\n",
       "3        MX000017004  1955      4      d12  32.0  16.0   12\n",
       "4        MX000017004  1955      4      d13  31.0  16.0   13\n",
       "...              ...   ...    ...      ...   ...   ...  ...\n",
       "17510    MX000017004  2011      4       d5   NaN   NaN    5\n",
       "17511    MX000017004  2011      4       d6   NaN   NaN    6\n",
       "17512    MX000017004  2011      4       d7   NaN   NaN    7\n",
       "17513    MX000017004  2011      4       d8   NaN   NaN    8\n",
       "17514    MX000017004  2011      4       d9   NaN   NaN    9\n",
       "\n",
       "[17515 rows x 7 columns]"
      ]
     },
     "execution_count": 98,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdfa_pivot = wdfa_pivot.assign(day=lambda df: df.variable.str[1:].astype('int'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "id": "17271ef2-c04c-4544-9517-296f9fce5bbe",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th>element</th>\n",
       "      <th>id</th>\n",
       "      <th>date</th>\n",
       "      <th>tmin</th>\n",
       "      <th>tmax</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955-04-01</td>\n",
       "      <td>15.0</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955-04-02</td>\n",
       "      <td>15.0</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955-04-03</td>\n",
       "      <td>16.0</td>\n",
       "      <td>31.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955-04-04</td>\n",
       "      <td>15.0</td>\n",
       "      <td>32.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>1955-04-05</td>\n",
       "      <td>16.0</td>\n",
       "      <td>33.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17502</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011-04-26</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17503</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011-04-27</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17504</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17505</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011-04-29</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17507</th>\n",
       "      <td>MX000017004</td>\n",
       "      <td>2011-04-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>17204 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "element           id       date  tmin  tmax\n",
       "0        MX000017004 1955-04-01  15.0  31.0\n",
       "11       MX000017004 1955-04-02  15.0  31.0\n",
       "22       MX000017004 1955-04-03  16.0  31.0\n",
       "25       MX000017004 1955-04-04  15.0  32.0\n",
       "26       MX000017004 1955-04-05  16.0  33.0\n",
       "...              ...        ...   ...   ...\n",
       "17502    MX000017004 2011-04-26   NaN   NaN\n",
       "17503    MX000017004 2011-04-27   NaN   NaN\n",
       "17504    MX000017004 2011-04-28   NaN   NaN\n",
       "17505    MX000017004 2011-04-29   NaN   NaN\n",
       "17507    MX000017004 2011-04-30   NaN   NaN\n",
       "\n",
       "[17204 rows x 4 columns]"
      ]
     },
     "execution_count": 99,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdfa_out = wdfa_pivot.assign(date=pd.to_datetime(wdfa_pivot[['year','month','day']],errors='coerce'))[['id','date','tmin','tmax']].query('date.notnull()').sort_values('date')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "id": "03e3ae7f-84de-431e-8291-055361d481a3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th>element</th>\n",
       "      <th>tmin</th>\n",
       "      <th>tmax</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>date</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1955</th>\n",
       "      <td>14.461818</td>\n",
       "      <td>26.647273</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1956</th>\n",
       "      <td>13.764881</td>\n",
       "      <td>26.526786</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1957</th>\n",
       "      <td>14.883582</td>\n",
       "      <td>27.913433</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1958</th>\n",
       "      <td>14.695890</td>\n",
       "      <td>26.723288</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1959</th>\n",
       "      <td>15.109589</td>\n",
       "      <td>26.802740</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1960</th>\n",
       "      <td>15.338798</td>\n",
       "      <td>27.519126</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1961</th>\n",
       "      <td>14.400000</td>\n",
       "      <td>26.989041</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1962</th>\n",
       "      <td>14.169604</td>\n",
       "      <td>28.002193</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1963</th>\n",
       "      <td>14.156934</td>\n",
       "      <td>23.952555</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1964</th>\n",
       "      <td>14.883582</td>\n",
       "      <td>25.895522</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1965</th>\n",
       "      <td>14.581522</td>\n",
       "      <td>24.873188</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1966</th>\n",
       "      <td>14.325275</td>\n",
       "      <td>25.731044</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1967</th>\n",
       "      <td>14.986849</td>\n",
       "      <td>27.406301</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1968</th>\n",
       "      <td>14.738251</td>\n",
       "      <td>26.098634</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1969</th>\n",
       "      <td>15.793132</td>\n",
       "      <td>26.959178</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1970</th>\n",
       "      <td>15.183014</td>\n",
       "      <td>27.375342</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1971</th>\n",
       "      <td>13.975092</td>\n",
       "      <td>25.882051</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1972</th>\n",
       "      <td>14.431694</td>\n",
       "      <td>25.725410</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1973</th>\n",
       "      <td>15.153968</td>\n",
       "      <td>25.882166</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1974</th>\n",
       "      <td>14.888268</td>\n",
       "      <td>26.262570</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1975</th>\n",
       "      <td>14.826027</td>\n",
       "      <td>25.853425</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1976</th>\n",
       "      <td>15.005556</td>\n",
       "      <td>25.848611</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1977</th>\n",
       "      <td>14.954795</td>\n",
       "      <td>26.610411</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1978</th>\n",
       "      <td>15.053571</td>\n",
       "      <td>26.532967</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1979</th>\n",
       "      <td>14.148352</td>\n",
       "      <td>27.968407</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1980</th>\n",
       "      <td>15.692623</td>\n",
       "      <td>26.822404</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1981</th>\n",
       "      <td>12.333333</td>\n",
       "      <td>24.666667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1982</th>\n",
       "      <td>13.833333</td>\n",
       "      <td>33.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1983</th>\n",
       "      <td>10.200000</td>\n",
       "      <td>27.300000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1985</th>\n",
       "      <td>8.300000</td>\n",
       "      <td>26.300000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1986</th>\n",
       "      <td>13.443750</td>\n",
       "      <td>29.606250</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1987</th>\n",
       "      <td>15.300000</td>\n",
       "      <td>30.362500</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1988</th>\n",
       "      <td>15.242308</td>\n",
       "      <td>30.565517</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1989</th>\n",
       "      <td>13.589809</td>\n",
       "      <td>29.883333</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1990</th>\n",
       "      <td>13.353676</td>\n",
       "      <td>28.583654</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1991</th>\n",
       "      <td>14.747387</td>\n",
       "      <td>28.954054</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1992</th>\n",
       "      <td>14.032698</td>\n",
       "      <td>28.200000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1993</th>\n",
       "      <td>14.473000</td>\n",
       "      <td>29.608571</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1994</th>\n",
       "      <td>13.891324</td>\n",
       "      <td>28.620800</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1995</th>\n",
       "      <td>12.712351</td>\n",
       "      <td>27.896939</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1996</th>\n",
       "      <td>12.215200</td>\n",
       "      <td>27.966667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1997</th>\n",
       "      <td>13.961404</td>\n",
       "      <td>27.749123</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1998</th>\n",
       "      <td>15.146739</td>\n",
       "      <td>32.223913</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1999</th>\n",
       "      <td>11.366667</td>\n",
       "      <td>26.769444</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000</th>\n",
       "      <td>13.952147</td>\n",
       "      <td>28.984663</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2001</th>\n",
       "      <td>14.000515</td>\n",
       "      <td>29.129381</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2002</th>\n",
       "      <td>13.974096</td>\n",
       "      <td>29.958434</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2003</th>\n",
       "      <td>13.855782</td>\n",
       "      <td>30.220408</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2004</th>\n",
       "      <td>11.918644</td>\n",
       "      <td>29.215254</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2005</th>\n",
       "      <td>13.909091</td>\n",
       "      <td>32.091919</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2006</th>\n",
       "      <td>13.980220</td>\n",
       "      <td>31.435165</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2007</th>\n",
       "      <td>14.207547</td>\n",
       "      <td>31.026415</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2008</th>\n",
       "      <td>14.466667</td>\n",
       "      <td>31.596970</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2009</th>\n",
       "      <td>13.373913</td>\n",
       "      <td>29.113043</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2010</th>\n",
       "      <td>14.651515</td>\n",
       "      <td>29.190909</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2011</th>\n",
       "      <td>14.170000</td>\n",
       "      <td>32.100000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "element       tmin       tmax\n",
       "date                         \n",
       "1955     14.461818  26.647273\n",
       "1956     13.764881  26.526786\n",
       "1957     14.883582  27.913433\n",
       "1958     14.695890  26.723288\n",
       "1959     15.109589  26.802740\n",
       "1960     15.338798  27.519126\n",
       "1961     14.400000  26.989041\n",
       "1962     14.169604  28.002193\n",
       "1963     14.156934  23.952555\n",
       "1964     14.883582  25.895522\n",
       "1965     14.581522  24.873188\n",
       "1966     14.325275  25.731044\n",
       "1967     14.986849  27.406301\n",
       "1968     14.738251  26.098634\n",
       "1969     15.793132  26.959178\n",
       "1970     15.183014  27.375342\n",
       "1971     13.975092  25.882051\n",
       "1972     14.431694  25.725410\n",
       "1973     15.153968  25.882166\n",
       "1974     14.888268  26.262570\n",
       "1975     14.826027  25.853425\n",
       "1976     15.005556  25.848611\n",
       "1977     14.954795  26.610411\n",
       "1978     15.053571  26.532967\n",
       "1979     14.148352  27.968407\n",
       "1980     15.692623  26.822404\n",
       "1981     12.333333  24.666667\n",
       "1982     13.833333  33.000000\n",
       "1983     10.200000  27.300000\n",
       "1985      8.300000  26.300000\n",
       "1986     13.443750  29.606250\n",
       "1987     15.300000  30.362500\n",
       "1988     15.242308  30.565517\n",
       "1989     13.589809  29.883333\n",
       "1990     13.353676  28.583654\n",
       "1991     14.747387  28.954054\n",
       "1992     14.032698  28.200000\n",
       "1993     14.473000  29.608571\n",
       "1994     13.891324  28.620800\n",
       "1995     12.712351  27.896939\n",
       "1996     12.215200  27.966667\n",
       "1997     13.961404  27.749123\n",
       "1998     15.146739  32.223913\n",
       "1999     11.366667  26.769444\n",
       "2000     13.952147  28.984663\n",
       "2001     14.000515  29.129381\n",
       "2002     13.974096  29.958434\n",
       "2003     13.855782  30.220408\n",
       "2004     11.918644  29.215254\n",
       "2005     13.909091  32.091919\n",
       "2006     13.980220  31.435165\n",
       "2007     14.207547  31.026415\n",
       "2008     14.466667  31.596970\n",
       "2009     13.373913  29.113043\n",
       "2010     14.651515  29.190909\n",
       "2011     14.170000  32.100000"
      ]
     },
     "execution_count": 100,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wdfa_out.groupby(wdfa_out['date'].dt.year)[['tmin','tmax']].mean()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "652715ee-6bf0-423f-b933-16d8353537af",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.14.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
