{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# GroupBy examples\n", "\n", "Allen Downey\n", "\n", "[MIT License](https://en.wikipedia.org/wiki/MIT_License)" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "%matplotlib inline\n", "\n", "import pandas as pd\n", "import numpy as np\n", "\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "sns.set(style='white')\n", "\n", "from thinkstats2 import Pmf, Cdf\n", "\n", "import thinkstats2\n", "import thinkplot\n", "\n", "decorate = thinkplot.config" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Let's load the General Social Survey (GSS) dataset." ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "CPU times: user 164 ms, sys: 40.2 ms, total: 204 ms\n", "Wall time: 203 ms\n" ] }, { "data": { "text/html": [ "
\n", " | year | \n", "id_ | \n", "agewed | \n", "divorce | \n", "sibs | \n", "childs | \n", "age | \n", "educ | \n", "paeduc | \n", "maeduc | \n", "... | \n", "memchurh | \n", "realinc | \n", "cohort | \n", "marcohrt | \n", "ballot | \n", "wtssall | \n", "adults | \n", "compuse | \n", "databank | \n", "wtssnr | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1972 | \n", "167 | \n", "0 | \n", "0 | \n", "2 | \n", "0 | \n", "26.0 | \n", "18.0 | \n", "12 | \n", "12 | \n", "... | \n", "0 | \n", "13537.0 | \n", "1946.0 | \n", "0 | \n", "0 | \n", "0.8893 | \n", "2.0 | \n", "0 | \n", "0 | \n", "1.0 | \n", "
1 | \n", "1972 | \n", "1256 | \n", "30 | \n", "2 | \n", "0 | \n", "1 | \n", "38.0 | \n", "12.0 | \n", "97 | \n", "99 | \n", "... | \n", "0 | \n", "18951.0 | \n", "1934.0 | \n", "1964 | \n", "0 | \n", "0.4446 | \n", "1.0 | \n", "0 | \n", "0 | \n", "1.0 | \n", "
2 | \n", "1972 | \n", "415 | \n", "0 | \n", "0 | \n", "7 | \n", "0 | \n", "57.0 | \n", "12.0 | \n", "7 | \n", "7 | \n", "... | \n", "0 | \n", "30458.0 | \n", "1915.0 | \n", "0 | \n", "0 | \n", "1.3339 | \n", "3.0 | \n", "0 | \n", "0 | \n", "1.0 | \n", "
3 | \n", "1972 | \n", "234 | \n", "18 | \n", "1 | \n", "6 | \n", "3 | \n", "61.0 | \n", "14.0 | \n", "8 | \n", "5 | \n", "... | \n", "0 | \n", "37226.0 | \n", "1911.0 | \n", "1929 | \n", "0 | \n", "0.8893 | \n", "2.0 | \n", "0 | \n", "0 | \n", "1.0 | \n", "
4 | \n", "1972 | \n", "554 | \n", "22 | \n", "2 | \n", "3 | \n", "3 | \n", "59.0 | \n", "12.0 | \n", "6 | \n", "11 | \n", "... | \n", "0 | \n", "30458.0 | \n", "1913.0 | \n", "1935 | \n", "0 | \n", "0.8893 | \n", "2.0 | \n", "0 | \n", "0 | \n", "1.0 | \n", "
5 rows × 101 columns
\n", "