diff --git a/notebooks/c05_Big_Data/Working_with_Big_Data.ipynb b/notebooks/c05_Big_Data/Working_with_Big_Data.ipynb index 24fccdf..00ea6c9 100644 --- a/notebooks/c05_Big_Data/Working_with_Big_Data.ipynb +++ b/notebooks/c05_Big_Data/Working_with_Big_Data.ipynb @@ -10,23 +10,14 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 4, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:00.534431Z", - "start_time": "2020-10-04T07:12:59.476700Z" + "end_time": "2020-10-14T02:29:11.178151Z", + "start_time": "2020-10-14T02:29:10.385397Z" } }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/dask/dataframe/utils.py:14: FutureWarning: pandas.util.testing is deprecated. Use the functions in the public API at pandas.testing instead.\n", - " import pandas.util.testing as tm\n" - ] - } - ], + "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", @@ -47,11 +38,11 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 5, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:00.541259Z", - "start_time": "2020-10-04T07:13:00.537506Z" + "end_time": "2020-10-14T02:29:11.181724Z", + "start_time": "2020-10-14T02:29:11.179663Z" } }, "outputs": [], @@ -68,11 +59,11 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 6, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:00.558769Z", - "start_time": "2020-10-04T07:13:00.550951Z" + "end_time": "2020-10-14T02:29:11.575247Z", + "start_time": "2020-10-14T02:29:11.571877Z" } }, "outputs": [], @@ -99,11 +90,11 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 7, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:00.572954Z", - "start_time": "2020-10-04T07:13:00.561729Z" + "end_time": "2020-10-14T02:29:12.597702Z", + "start_time": "2020-10-14T02:29:12.592553Z" } }, "outputs": [ @@ -111,16 +102,16 @@ 
"name": "stdout", "output_type": "stream", "text": [ - "[Process 3303031 uses 116.1MB]\n" + "[Process 2285 uses 121.8MB]\n" ] }, { "data": { "text/plain": [ - "116.05078125" + "121.80078125" ] }, - "execution_count": 4, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -139,11 +130,11 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 8, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.327228Z", - "start_time": "2020-10-04T07:13:00.576215Z" + "end_time": "2020-10-14T02:29:46.295397Z", + "start_time": "2020-10-14T02:29:39.406596Z" } }, "outputs": [ @@ -151,8 +142,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 3.41 s, sys: 315 ms, total: 3.73 s\n", - "Wall time: 3.74 s\n" + "CPU times: user 2.41 s, sys: 343 ms, total: 2.75 s\n", + "Wall time: 6.89 s\n" ] } ], @@ -163,11 +154,11 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 9, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.338688Z", - "start_time": "2020-10-04T07:13:04.330235Z" + "end_time": "2020-10-14T02:30:08.792445Z", + "start_time": "2020-10-14T02:30:08.788405Z" } }, "outputs": [ @@ -175,16 +166,16 @@ "name": "stdout", "output_type": "stream", "text": [ - "[Process 3303031 uses 624.0MB]\n" + "[Process 2285 uses 628.9MB]\n" ] }, { "data": { "text/plain": [ - "624.02734375" + "628.921875" ] }, - "execution_count": 6, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -203,11 +194,11 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 10, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.622452Z", - "start_time": "2020-10-04T07:13:04.345357Z" + "end_time": "2020-10-14T02:30:29.733889Z", + "start_time": "2020-10-14T02:30:29.665680Z" } }, "outputs": [ @@ -215,8 +206,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 271 ms, sys: 235 µs, total: 271 ms\n", - "Wall time: 270 ms\n" + "CPU 
times: user 62.2 ms, sys: 4.01 ms, total: 66.2 ms\n", + "Wall time: 65.2 ms\n" ] } ], @@ -227,11 +218,11 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 11, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.632554Z", - "start_time": "2020-10-04T07:13:04.625654Z" + "end_time": "2020-10-14T02:30:38.969341Z", + "start_time": "2020-10-14T02:30:38.964629Z" } }, "outputs": [ @@ -239,16 +230,16 @@ "name": "stdout", "output_type": "stream", "text": [ - "[Process 3303031 uses 624.0MB]\n" + "[Process 2285 uses 628.9MB]\n" ] }, { "data": { "text/plain": [ - "624.02734375" + "628.921875" ] }, - "execution_count": 8, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -275,11 +266,11 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 12, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.652509Z", - "start_time": "2020-10-04T07:13:04.635259Z" + "end_time": "2020-10-14T02:31:12.339688Z", + "start_time": "2020-10-14T02:31:12.327592Z" } }, "outputs": [ @@ -287,8 +278,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 4.35 ms, sys: 3.89 ms, total: 8.24 ms\n", - "Wall time: 7.08 ms\n" + "CPU times: user 6.89 ms, sys: 0 ns, total: 6.89 ms\n", + "Wall time: 6.24 ms\n" ] }, { @@ -308,7 +299,7 @@ "Length: 100, dtype: float64" ] }, - "execution_count": 9, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -328,11 +319,11 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 13, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.735404Z", - "start_time": "2020-10-04T07:13:04.654934Z" + "end_time": "2020-10-14T02:32:05.591164Z", + "start_time": "2020-10-14T02:32:05.550701Z" } }, "outputs": [ @@ -340,8 +331,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 76.8 ms, sys: 199 µs, total: 77 ms\n", - "Wall time: 75.2 ms\n" + "CPU times: user 38.3 ms, sys: 16 µs, total: 38.3 
ms\n", + "Wall time: 37.3 ms\n" ] } ], @@ -359,11 +350,11 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 14, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:04.746367Z", - "start_time": "2020-10-04T07:13:04.738422Z" + "end_time": "2020-10-14T02:32:16.632186Z", + "start_time": "2020-10-14T02:32:16.627016Z" } }, "outputs": [ @@ -375,10 +366,10 @@ "pixel100 float64\n", "pixel99 ...\n", "dtype: float64\n", - "Dask Name: dataframe-mean, 15 tasks" + "Dask Name: dataframe-mean, 11 tasks" ] }, - "execution_count": 11, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -397,11 +388,11 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 15, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:08.971892Z", - "start_time": "2020-10-04T07:13:04.750170Z" + "end_time": "2020-10-14T02:33:00.902439Z", + "start_time": "2020-10-14T02:32:58.210666Z" } }, "outputs": [ @@ -409,8 +400,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 4.52 s, sys: 543 ms, total: 5.06 s\n", - "Wall time: 4.21 s\n" + "CPU times: user 2.76 s, sys: 470 ms, total: 3.23 s\n", + "Wall time: 2.69 s\n" ] }, { @@ -430,7 +421,7 @@ "Length: 100, dtype: float64" ] }, - "execution_count": 12, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" } @@ -472,11 +463,11 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 16, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:08.978326Z", - "start_time": "2020-10-04T07:13:08.975521Z" + "end_time": "2020-10-14T02:38:10.718460Z", + "start_time": "2020-10-14T02:38:10.716474Z" } }, "outputs": [], @@ -494,11 +485,11 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 17, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:09.062783Z", - "start_time": "2020-10-04T07:13:08.981747Z" + "end_time": "2020-10-14T02:38:11.564096Z", + "start_time": 
"2020-10-14T02:38:11.523227Z" } }, "outputs": [], @@ -522,11 +513,11 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 18, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:13.684735Z", - "start_time": "2020-10-04T07:13:09.065291Z" + "end_time": "2020-10-14T02:38:16.671639Z", + "start_time": "2020-10-14T02:38:14.308997Z" } }, "outputs": [ @@ -534,7 +525,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[########################################] | 100% Completed | 4.6s\n" + "[########################################] | 100% Completed | 2.4s\n" ] } ], @@ -554,11 +545,11 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 19, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:14.051240Z", - "start_time": "2020-10-04T07:13:13.686819Z" + "end_time": "2020-10-14T02:39:07.219912Z", + "start_time": "2020-10-14T02:39:07.048911Z" } }, "outputs": [], @@ -568,11 +559,11 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 20, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:19.196451Z", - "start_time": "2020-10-04T07:13:14.053718Z" + "end_time": "2020-10-14T02:39:10.886195Z", + "start_time": "2020-10-14T02:39:07.601655Z" } }, "outputs": [ @@ -580,7 +571,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[########################################] | 100% Completed | 5.1s\n" + "[########################################] | 100% Completed | 3.3s\n" ] } ], @@ -591,11 +582,11 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 21, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:19.210681Z", - "start_time": "2020-10-04T07:13:19.200112Z" + "end_time": "2020-10-14T02:39:42.422134Z", + "start_time": "2020-10-14T02:39:42.417217Z" } }, "outputs": [ @@ -616,7 +607,7 @@ "Length: 785, dtype: float64" ] }, - "execution_count": 18, + "execution_count": 21, "metadata": {}, "output_type": "execute_result" } @@ -627,11 +618,11 @@ }, 
{ "cell_type": "code", - "execution_count": 19, + "execution_count": 22, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:19.257560Z", - "start_time": "2020-10-04T07:13:19.214249Z" + "end_time": "2020-10-14T02:39:45.447075Z", + "start_time": "2020-10-14T02:39:45.426516Z" } }, "outputs": [], @@ -641,11 +632,11 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 23, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:23.551522Z", - "start_time": "2020-10-04T07:13:19.260901Z" + "end_time": "2020-10-14T02:39:48.551108Z", + "start_time": "2020-10-14T02:39:45.975978Z" } }, "outputs": [ @@ -653,7 +644,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[########################################] | 100% Completed | 4.3s\n" + "[########################################] | 100% Completed | 2.6s\n" ] } ], @@ -664,11 +655,11 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 24, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:23.576434Z", - "start_time": "2020-10-04T07:13:23.555071Z" + "end_time": "2020-10-14T02:39:54.015896Z", + "start_time": "2020-10-14T02:39:54.007397Z" } }, "outputs": [ @@ -784,7 +775,7 @@ "9 0.000000 77.106256 0.142550" ] }, - "execution_count": 21, + "execution_count": 24, "metadata": {}, "output_type": "execute_result" } @@ -795,704 +786,8242 @@ }, { "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "
\n", - "

Exercise

\n", - "\n", - "Use Dask dataframe of MNIST (df2) and follow these steps:\n", - " \n", - "1. Add a new column called `sum` to the dataframe which contains sum of all the pixels\n", - "2. Use groupby to find the mean value for `sum` for each label\n", - " \n", - "\n", - "
\n", - " → Hints\n", - "\n", - " * Columns 1 onwards are the pixels. You can access them with `pixels=df2.iloc[:, 1:]`\n", - " * Instead of `df['sum']=pixels.sum()` try `df['sum']=pixels.sum(axis=1)` because we want to sum along columns, not rows\n", - " * If the dask output is confusing, try with df1 first\n", - " * to groupby use `df2.groupby('label').?`, where you replace the `?` with the aggregation operation\n", - "\n", - "
\n", - "\n", - "
\n", - "
\n", - "
\n", - " \n", - " → Solution\n", - " \n", - "\n", - " ```python\n", - " # With pandas\n", - " pixels = df1.loc[:, ['pixel' in c for c in df1.columns]]\n", - " df1['sum']=pixels.sum(axis=1)\n", - " task = df1[['label','sum']].groupby('label').mean()\n", - " print(result)\n", - "\n", - " # With dask\n", - " pixels = df2.loc[:, ['pixel' in c for c in df2.columns]]\n", - " df2['sum']=pixels.sum(axis=1)\n", - " task = df2[['label','sum']].groupby('label').mean()\n", - " with ProgressBar():\n", - " result=task.compute() \n", - " print(result)\n", - " ```\n", - "\n", - "
\n", - "\n", - "
" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## When to use Dask DataFrame?\n", - "\n", - "Lets visit [the dask page](https://docs.dask.org/en/latest/dataframe.html#common-uses-and-anti-uses) to look at when we should use it\n", - "\n", - "It is harder so only if you dataset is larger than memory.\n", - "\n", - "If fact also consider:\n", - "- a database (if you have lots of structured queries)\n", - "- https://downloadmoreram.com/ ;p\n", - "- dask array" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Dask Array\n", - "Dask is not just used to replace pandas. There are also multiple numpy functions which can be replaced by Dask. Dask array is Dask equivalent of a numpy array. By doing so, we can perform the computations in parallel and get the results faster." - ] - }, - { - "cell_type": "code", - "execution_count": 22, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:13:23.588550Z", - "start_time": "2020-10-04T07:13:23.584811Z" - } - }, - "outputs": [], - "source": [ - "from dask import array" - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:13:23.605397Z", - "start_time": "2020-10-04T07:13:23.593664Z" - } - }, - "outputs": [], - "source": [ - "big_array = array.random.normal(size=(10000000, 100), chunks=200000)" - ] - }, - { - "cell_type": "code", - "execution_count": 24, + "execution_count": 29, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:23.616314Z", - "start_time": "2020-10-04T07:13:23.608703Z" + "end_time": "2020-10-14T02:46:19.562831Z", + "start_time": "2020-10-14T02:46:18.729080Z" } }, "outputs": [ { "data": { "text/html": [ - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "
\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Array Chunk
Bytes 8.00 GB 160.00 MB
Shape (10000000, 100) (200000, 100)
Count 50 Tasks 50 Chunks
Type float64 numpy.ndarray
\n", - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "\n", - " \n", - " \n", - " \n", + "
Dask DataFrame Structure:
\n", + "
\n", + "\n", + "\n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Array Chunk
Bytes 800 B 800 B
Shape (100,) (100,)
Count 68 Tasks 1 Chunks
Type float64 numpy.ndarray
\n", - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - "\n", - " \n", - " \n", - " \n", - "\n", - " \n", - " \n", - "\n", - " \n", - " 100\n", - " 1\n", - "\n", - "
" - ], - "text/plain": [ - "dask.array" - ] - }, - "execution_count": 29, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "task" - ] - }, - { - "cell_type": "code", - "execution_count": 30, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:13:53.277483Z", - "start_time": "2020-10-04T07:13:53.268206Z" - } - }, - "outputs": [ - { - "data": { - "text/plain": [ - "array([-1.17109224e-04, -2.37748610e-05, 1.67655302e-04, 9.72602555e-05,\n", - " -1.21246755e-04, 1.86229870e-04, -2.90821428e-04, -2.79825330e-04,\n", - " 1.36715765e-04, -5.00321866e-06, -8.71579028e-05, -5.53870480e-05,\n", - " -2.99278608e-04, 8.90632815e-05, 2.23756405e-05, -8.12409603e-05,\n", - " 1.15169616e-04, -3.89092182e-04, -1.53707025e-06, 2.39661084e-04,\n", - " -1.80096422e-04, 2.74128387e-04, -2.44078965e-04, -1.83305381e-04,\n", - " -3.63807417e-05, -3.47435128e-04, -7.35919945e-05, 2.29875992e-04,\n", - " 2.71309995e-04, 2.23522462e-04, -3.06297908e-04, 1.31446736e-04,\n", - " 4.68200987e-04, -4.46962346e-04, -1.98344059e-04, -2.83531171e-04,\n", - " 1.67231803e-04, 2.33479578e-04, -1.16014913e-04, -8.46083969e-05,\n", - " 3.82956303e-05, -7.75966025e-05, -9.45842315e-05, -1.46859581e-04,\n", - " 2.66761928e-05, 5.43888756e-04, 1.30971229e-04, 3.03536632e-04,\n", - " -2.70213468e-04, -3.35363834e-04, -4.89288567e-04, -1.24321567e-04,\n", - " 9.31827182e-06, 3.91525970e-04, 1.39809241e-04, 5.34253751e-04,\n", - " 2.57985579e-05, -3.90105425e-04, 2.16084327e-04, -3.36460548e-04,\n", - " -3.10813633e-05, 2.96684317e-04, 3.42895144e-04, 2.19669624e-05,\n", - " -1.82899301e-05, -6.85668196e-06, -2.03926052e-05, -1.92327105e-04,\n", - " -5.36787318e-05, -1.75316594e-04, 5.00921038e-04, 1.45688893e-04,\n", - " -3.96319489e-05, 7.60191739e-05, 1.03714211e-04, 3.41146659e-04,\n", - " 3.12939637e-04, -1.25675053e-04, 3.47103013e-05, -4.55230167e-04,\n", - " 2.66342456e-04, 3.01029884e-04, -1.44831019e-04, -1.02233797e-04,\n", - " 3.72579009e-04, 
-1.29388430e-04, 1.84378422e-04, -1.72381630e-04,\n", - " 2.03004813e-04, 2.35664428e-04, 3.33605329e-04, -1.46503189e-04,\n", - " -4.94174663e-06, 4.60467235e-05, 1.21205920e-04, 1.01241642e-04,\n", - " -8.10986294e-06, 1.66141228e-05, -2.12343799e-04, -3.61209569e-04])" - ] - }, - "execution_count": 30, - "metadata": {}, - "output_type": "execute_result" - } + " \n", + " \n", + " label\n", + " pixel0\n", + " pixel1\n", + " pixel2\n", + " pixel3\n", + " pixel4\n", + " pixel5\n", + " pixel6\n", + " pixel7\n", + " pixel8\n", + " pixel9\n", + " pixel10\n", + " pixel11\n", + " pixel12\n", + " pixel13\n", + " pixel14\n", + " pixel15\n", + " pixel16\n", + " pixel17\n", + " pixel18\n", + " pixel19\n", + " pixel20\n", + " pixel21\n", + " pixel22\n", + " pixel23\n", + " pixel24\n", + " pixel25\n", + " pixel26\n", + " pixel27\n", + " pixel28\n", + " pixel29\n", + " pixel30\n", + " pixel31\n", + " pixel32\n", + " pixel33\n", + " pixel34\n", + " pixel35\n", + " pixel36\n", + " pixel37\n", + " pixel38\n", + " pixel39\n", + " pixel40\n", + " pixel41\n", + " pixel42\n", + " pixel43\n", + " pixel44\n", + " pixel45\n", + " pixel46\n", + " pixel47\n", + " pixel48\n", + " pixel49\n", + " pixel50\n", + " pixel51\n", + " pixel52\n", + " pixel53\n", + " pixel54\n", + " pixel55\n", + " pixel56\n", + " pixel57\n", + " pixel58\n", + " pixel59\n", + " pixel60\n", + " pixel61\n", + " pixel62\n", + " pixel63\n", + " pixel64\n", + " pixel65\n", + " pixel66\n", + " pixel67\n", + " pixel68\n", + " pixel69\n", + " pixel70\n", + " pixel71\n", + " pixel72\n", + " pixel73\n", + " pixel74\n", + " pixel75\n", + " pixel76\n", + " pixel77\n", + " pixel78\n", + " pixel79\n", + " pixel80\n", + " pixel81\n", + " pixel82\n", + " pixel83\n", + " pixel84\n", + " pixel85\n", + " pixel86\n", + " pixel87\n", + " pixel88\n", + " pixel89\n", + " pixel90\n", + " pixel91\n", + " pixel92\n", + " pixel93\n", + " pixel94\n", + " pixel95\n", + " pixel96\n", + " pixel97\n", + " pixel98\n", + " pixel99\n", + " 
pixel100\n", + " pixel101\n", + " pixel102\n", + " pixel103\n", + " pixel104\n", + " pixel105\n", + " pixel106\n", + " pixel107\n", + " pixel108\n", + " pixel109\n", + " pixel110\n", + " pixel111\n", + " pixel112\n", + " pixel113\n", + " pixel114\n", + " pixel115\n", + " pixel116\n", + " pixel117\n", + " pixel118\n", + " pixel119\n", + " pixel120\n", + " pixel121\n", + " pixel122\n", + " pixel123\n", + " pixel124\n", + " pixel125\n", + " pixel126\n", + " pixel127\n", + " pixel128\n", + " pixel129\n", + " pixel130\n", + " pixel131\n", + " pixel132\n", + " pixel133\n", + " pixel134\n", + " pixel135\n", + " pixel136\n", + " pixel137\n", + " pixel138\n", + " pixel139\n", + " pixel140\n", + " pixel141\n", + " pixel142\n", + " pixel143\n", + " pixel144\n", + " pixel145\n", + " pixel146\n", + " pixel147\n", + " pixel148\n", + " pixel149\n", + " pixel150\n", + " pixel151\n", + " pixel152\n", + " pixel153\n", + " pixel154\n", + " pixel155\n", + " pixel156\n", + " pixel157\n", + " pixel158\n", + " pixel159\n", + " pixel160\n", + " pixel161\n", + " pixel162\n", + " pixel163\n", + " pixel164\n", + " pixel165\n", + " pixel166\n", + " pixel167\n", + " pixel168\n", + " pixel169\n", + " pixel170\n", + " pixel171\n", + " pixel172\n", + " pixel173\n", + " pixel174\n", + " pixel175\n", + " pixel176\n", + " pixel177\n", + " pixel178\n", + " pixel179\n", + " pixel180\n", + " pixel181\n", + " pixel182\n", + " pixel183\n", + " pixel184\n", + " pixel185\n", + " pixel186\n", + " pixel187\n", + " pixel188\n", + " pixel189\n", + " pixel190\n", + " pixel191\n", + " pixel192\n", + " pixel193\n", + " pixel194\n", + " pixel195\n", + " pixel196\n", + " pixel197\n", + " pixel198\n", + " pixel199\n", + " pixel200\n", + " pixel201\n", + " pixel202\n", + " pixel203\n", + " pixel204\n", + " pixel205\n", + " pixel206\n", + " pixel207\n", + " pixel208\n", + " pixel209\n", + " pixel210\n", + " pixel211\n", + " pixel212\n", + " pixel213\n", + " pixel214\n", + " pixel215\n", + " pixel216\n", + " 
pixel217\n", + " pixel218\n", + " pixel219\n", + " pixel220\n", + " pixel221\n", + " pixel222\n", + " pixel223\n", + " pixel224\n", + " pixel225\n", + " pixel226\n", + " pixel227\n", + " pixel228\n", + " pixel229\n", + " pixel230\n", + " pixel231\n", + " pixel232\n", + " pixel233\n", + " pixel234\n", + " pixel235\n", + " pixel236\n", + " pixel237\n", + " pixel238\n", + " pixel239\n", + " pixel240\n", + " pixel241\n", + " pixel242\n", + " pixel243\n", + " pixel244\n", + " pixel245\n", + " pixel246\n", + " pixel247\n", + " pixel248\n", + " pixel249\n", + " pixel250\n", + " pixel251\n", + " pixel252\n", + " pixel253\n", + " pixel254\n", + " pixel255\n", + " pixel256\n", + " pixel257\n", + " pixel258\n", + " pixel259\n", + " pixel260\n", + " pixel261\n", + " pixel262\n", + " pixel263\n", + " pixel264\n", + " pixel265\n", + " pixel266\n", + " pixel267\n", + " pixel268\n", + " pixel269\n", + " pixel270\n", + " pixel271\n", + " pixel272\n", + " pixel273\n", + " pixel274\n", + " pixel275\n", + " pixel276\n", + " pixel277\n", + " pixel278\n", + " pixel279\n", + " pixel280\n", + " pixel281\n", + " pixel282\n", + " pixel283\n", + " pixel284\n", + " pixel285\n", + " pixel286\n", + " pixel287\n", + " pixel288\n", + " pixel289\n", + " pixel290\n", + " pixel291\n", + " pixel292\n", + " pixel293\n", + " pixel294\n", + " pixel295\n", + " pixel296\n", + " pixel297\n", + " pixel298\n", + " pixel299\n", + " pixel300\n", + " pixel301\n", + " pixel302\n", + " pixel303\n", + " pixel304\n", + " pixel305\n", + " pixel306\n", + " pixel307\n", + " pixel308\n", + " pixel309\n", + " pixel310\n", + " pixel311\n", + " pixel312\n", + " pixel313\n", + " pixel314\n", + " pixel315\n", + " pixel316\n", + " pixel317\n", + " pixel318\n", + " pixel319\n", + " pixel320\n", + " pixel321\n", + " pixel322\n", + " pixel323\n", + " pixel324\n", + " pixel325\n", + " pixel326\n", + " pixel327\n", + " pixel328\n", + " pixel329\n", + " pixel330\n", + " pixel331\n", + " pixel332\n", + " pixel333\n", + " 
pixel334\n", + " pixel335\n", + " pixel336\n", + " pixel337\n", + " pixel338\n", + " pixel339\n", + " pixel340\n", + " pixel341\n", + " pixel342\n", + " pixel343\n", + " pixel344\n", + " pixel345\n", + " pixel346\n", + " pixel347\n", + " pixel348\n", + " pixel349\n", + " pixel350\n", + " pixel351\n", + " pixel352\n", + " pixel353\n", + " pixel354\n", + " pixel355\n", + " pixel356\n", + " pixel357\n", + " pixel358\n", + " pixel359\n", + " pixel360\n", + " pixel361\n", + " pixel362\n", + " pixel363\n", + " pixel364\n", + " pixel365\n", + " pixel366\n", + " pixel367\n", + " pixel368\n", + " pixel369\n", + " pixel370\n", + " pixel371\n", + " pixel372\n", + " pixel373\n", + " pixel374\n", + " pixel375\n", + " pixel376\n", + " pixel377\n", + " pixel378\n", + " pixel379\n", + " pixel380\n", + " pixel381\n", + " pixel382\n", + " pixel383\n", + " pixel384\n", + " pixel385\n", + " pixel386\n", + " pixel387\n", + " pixel388\n", + " pixel389\n", + " pixel390\n", + " pixel391\n", + " pixel392\n", + " pixel393\n", + " pixel394\n", + " pixel395\n", + " pixel396\n", + " pixel397\n", + " pixel398\n", + " pixel399\n", + " pixel400\n", + " pixel401\n", + " pixel402\n", + " pixel403\n", + " pixel404\n", + " pixel405\n", + " pixel406\n", + " pixel407\n", + " pixel408\n", + " pixel409\n", + " pixel410\n", + " pixel411\n", + " pixel412\n", + " pixel413\n", + " pixel414\n", + " pixel415\n", + " pixel416\n", + " pixel417\n", + " pixel418\n", + " pixel419\n", + " pixel420\n", + " pixel421\n", + " pixel422\n", + " pixel423\n", + " pixel424\n", + " pixel425\n", + " pixel426\n", + " pixel427\n", + " pixel428\n", + " pixel429\n", + " pixel430\n", + " pixel431\n", + " pixel432\n", + " pixel433\n", + " pixel434\n", + " pixel435\n", + " pixel436\n", + " pixel437\n", + " pixel438\n", + " pixel439\n", + " pixel440\n", + " pixel441\n", + " pixel442\n", + " pixel443\n", + " pixel444\n", + " pixel445\n", + " pixel446\n", + " pixel447\n", + " pixel448\n", + " pixel449\n", + " pixel450\n", + " 
pixel451\n", + " pixel452\n", + " pixel453\n", + " pixel454\n", + " pixel455\n", + " pixel456\n", + " pixel457\n", + " pixel458\n", + " pixel459\n", + " pixel460\n", + " pixel461\n", + " pixel462\n", + " pixel463\n", + " pixel464\n", + " pixel465\n", + " pixel466\n", + " pixel467\n", + " pixel468\n", + " pixel469\n", + " pixel470\n", + " pixel471\n", + " pixel472\n", + " pixel473\n", + " pixel474\n", + " pixel475\n", + " pixel476\n", + " pixel477\n", + " pixel478\n", + " pixel479\n", + " pixel480\n", + " pixel481\n", + " pixel482\n", + " pixel483\n", + " pixel484\n", + " pixel485\n", + " pixel486\n", + " pixel487\n", + " pixel488\n", + " pixel489\n", + " pixel490\n", + " pixel491\n", + " pixel492\n", + " pixel493\n", + " pixel494\n", + " pixel495\n", + " pixel496\n", + " pixel497\n", + " pixel498\n", + " pixel499\n", + " pixel500\n", + " pixel501\n", + " pixel502\n", + " pixel503\n", + " pixel504\n", + " pixel505\n", + " pixel506\n", + " pixel507\n", + " pixel508\n", + " pixel509\n", + " pixel510\n", + " pixel511\n", + " pixel512\n", + " pixel513\n", + " pixel514\n", + " pixel515\n", + " pixel516\n", + " pixel517\n", + " pixel518\n", + " pixel519\n", + " pixel520\n", + " pixel521\n", + " pixel522\n", + " pixel523\n", + " pixel524\n", + " pixel525\n", + " pixel526\n", + " pixel527\n", + " pixel528\n", + " pixel529\n", + " pixel530\n", + " pixel531\n", + " pixel532\n", + " pixel533\n", + " pixel534\n", + " pixel535\n", + " pixel536\n", + " pixel537\n", + " pixel538\n", + " pixel539\n", + " pixel540\n", + " pixel541\n", + " pixel542\n", + " pixel543\n", + " pixel544\n", + " pixel545\n", + " pixel546\n", + " pixel547\n", + " pixel548\n", + " pixel549\n", + " pixel550\n", + " pixel551\n", + " pixel552\n", + " pixel553\n", + " pixel554\n", + " pixel555\n", + " pixel556\n", + " pixel557\n", + " pixel558\n", + " pixel559\n", + " pixel560\n", + " pixel561\n", + " pixel562\n", + " pixel563\n", + " pixel564\n", + " pixel565\n", + " pixel566\n", + " pixel567\n", + " 
pixel568\n", + " pixel569\n", + " pixel570\n", + " pixel571\n", + " pixel572\n", + " pixel573\n", + " pixel574\n", + " pixel575\n", + " pixel576\n", + " pixel577\n", + " pixel578\n", + " pixel579\n", + " pixel580\n", + " pixel581\n", + " pixel582\n", + " pixel583\n", + " pixel584\n", + " pixel585\n", + " pixel586\n", + " pixel587\n", + " pixel588\n", + " pixel589\n", + " pixel590\n", + " pixel591\n", + " pixel592\n", + " pixel593\n", + " pixel594\n", + " pixel595\n", + " pixel596\n", + " pixel597\n", + " pixel598\n", + " pixel599\n", + " pixel600\n", + " pixel601\n", + " pixel602\n", + " pixel603\n", + " pixel604\n", + " pixel605\n", + " pixel606\n", + " pixel607\n", + " pixel608\n", + " pixel609\n", + " pixel610\n", + " pixel611\n", + " pixel612\n", + " pixel613\n", + " pixel614\n", + " pixel615\n", + " pixel616\n", + " pixel617\n", + " pixel618\n", + " pixel619\n", + " pixel620\n", + " pixel621\n", + " pixel622\n", + " pixel623\n", + " pixel624\n", + " pixel625\n", + " pixel626\n", + " pixel627\n", + " pixel628\n", + " pixel629\n", + " pixel630\n", + " pixel631\n", + " pixel632\n", + " pixel633\n", + " pixel634\n", + " pixel635\n", + " pixel636\n", + " pixel637\n", + " pixel638\n", + " pixel639\n", + " pixel640\n", + " pixel641\n", + " pixel642\n", + " pixel643\n", + " pixel644\n", + " pixel645\n", + " pixel646\n", + " pixel647\n", + " pixel648\n", + " pixel649\n", + " pixel650\n", + " pixel651\n", + " pixel652\n", + " pixel653\n", + " pixel654\n", + " pixel655\n", + " pixel656\n", + " pixel657\n", + " pixel658\n", + " pixel659\n", + " pixel660\n", + " pixel661\n", + " pixel662\n", + " pixel663\n", + " pixel664\n", + " pixel665\n", + " pixel666\n", + " pixel667\n", + " pixel668\n", + " pixel669\n", + " pixel670\n", + " pixel671\n", + " pixel672\n", + " pixel673\n", + " pixel674\n", + " pixel675\n", + " pixel676\n", + " pixel677\n", + " pixel678\n", + " pixel679\n", + " pixel680\n", + " pixel681\n", + " pixel682\n", + " pixel683\n", + " pixel684\n", + " 
pixel685\n", + " pixel686\n", + " pixel687\n", + " pixel688\n", + " pixel689\n", + " pixel690\n", + " pixel691\n", + " pixel692\n", + " pixel693\n", + " pixel694\n", + " pixel695\n", + " pixel696\n", + " pixel697\n", + " pixel698\n", + " pixel699\n", + " pixel700\n", + " pixel701\n", + " pixel702\n", + " pixel703\n", + " pixel704\n", + " pixel705\n", + " pixel706\n", + " pixel707\n", + " pixel708\n", + " pixel709\n", + " pixel710\n", + " pixel711\n", + " pixel712\n", + " pixel713\n", + " pixel714\n", + " pixel715\n", + " pixel716\n", + " pixel717\n", + " pixel718\n", + " pixel719\n", + " pixel720\n", + " pixel721\n", + " pixel722\n", + " pixel723\n", + " pixel724\n", + " pixel725\n", + " pixel726\n", + " pixel727\n", + " pixel728\n", + " pixel729\n", + " pixel730\n", + " pixel731\n", + " pixel732\n", + " pixel733\n", + " pixel734\n", + " pixel735\n", + " pixel736\n", + " pixel737\n", + " pixel738\n", + " pixel739\n", + " pixel740\n", + " pixel741\n", + " pixel742\n", + " pixel743\n", + " pixel744\n", + " pixel745\n", + " pixel746\n", + " pixel747\n", + " pixel748\n", + " pixel749\n", + " pixel750\n", + " pixel751\n", + " pixel752\n", + " pixel753\n", + " pixel754\n", + " pixel755\n", + " pixel756\n", + " pixel757\n", + " pixel758\n", + " pixel759\n", + " pixel760\n", + " pixel761\n", + " pixel762\n", + " pixel763\n", + " pixel764\n", + " pixel765\n", + " pixel766\n", + " pixel767\n", + " pixel768\n", + " pixel769\n", + " pixel770\n", + " pixel771\n", + " pixel772\n", + " pixel773\n", + " pixel774\n", + " pixel775\n", + " pixel776\n", + " pixel777\n", + " pixel778\n", + " pixel779\n", + " pixel780\n", + " pixel781\n", + " pixel782\n", + " pixel783\n", + " \n", + " \n", + " npartitions=2\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + 
" \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " 
int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + 
" int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", 
+ " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " 
int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + 
" int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " int64\n", + " \n", + " \n", + " \n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", 
+ " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", 
+ " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " \n", + " \n", + " \n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", 
+ " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", 
+ " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " 
...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " ...\n", + " \n", + " \n", + "\n", + "\n", + "
Dask Name: read-csv, 2 tasks
" + ], + "text/plain": [ + "Dask DataFrame Structure:\n", + " label pixel0 pixel1 pixel2 pixel3 pixel4 pixel5 pixel6 pixel7 pixel8 pixel9 pixel10 pixel11 pixel12 pixel13 pixel14 pixel15 pixel16 pixel17 pixel18 pixel19 pixel20 pixel21 pixel22 pixel23 pixel24 pixel25 pixel26 pixel27 pixel28 pixel29 pixel30 pixel31 pixel32 pixel33 pixel34 pixel35 pixel36 pixel37 pixel38 pixel39 pixel40 pixel41 pixel42 pixel43 pixel44 pixel45 pixel46 pixel47 pixel48 pixel49 pixel50 pixel51 pixel52 pixel53 pixel54 pixel55 pixel56 pixel57 pixel58 pixel59 pixel60 pixel61 pixel62 pixel63 pixel64 pixel65 pixel66 pixel67 pixel68 pixel69 pixel70 pixel71 pixel72 pixel73 pixel74 pixel75 pixel76 pixel77 pixel78 pixel79 pixel80 pixel81 pixel82 pixel83 pixel84 pixel85 pixel86 pixel87 pixel88 pixel89 pixel90 pixel91 pixel92 pixel93 pixel94 pixel95 pixel96 pixel97 pixel98 pixel99 pixel100 pixel101 pixel102 pixel103 pixel104 pixel105 pixel106 pixel107 pixel108 pixel109 pixel110 pixel111 pixel112 pixel113 pixel114 pixel115 pixel116 pixel117 pixel118 pixel119 pixel120 pixel121 pixel122 pixel123 pixel124 pixel125 pixel126 pixel127 pixel128 pixel129 pixel130 pixel131 pixel132 pixel133 pixel134 pixel135 pixel136 pixel137 pixel138 pixel139 pixel140 pixel141 pixel142 pixel143 pixel144 pixel145 pixel146 pixel147 pixel148 pixel149 pixel150 pixel151 pixel152 pixel153 pixel154 pixel155 pixel156 pixel157 pixel158 pixel159 pixel160 pixel161 pixel162 pixel163 pixel164 pixel165 pixel166 pixel167 pixel168 pixel169 pixel170 pixel171 pixel172 pixel173 pixel174 pixel175 pixel176 pixel177 pixel178 pixel179 pixel180 pixel181 pixel182 pixel183 pixel184 pixel185 pixel186 pixel187 pixel188 pixel189 pixel190 pixel191 pixel192 pixel193 pixel194 pixel195 pixel196 pixel197 pixel198 pixel199 pixel200 pixel201 pixel202 pixel203 pixel204 pixel205 pixel206 pixel207 pixel208 pixel209 pixel210 pixel211 pixel212 pixel213 pixel214 pixel215 pixel216 pixel217 pixel218 pixel219 pixel220 pixel221 pixel222 pixel223 pixel224 pixel225 
pixel226 pixel227 pixel228 pixel229 pixel230 pixel231 pixel232 pixel233 pixel234 pixel235 pixel236 pixel237 pixel238 pixel239 pixel240 pixel241 pixel242 pixel243 pixel244 pixel245 pixel246 pixel247 pixel248 pixel249 pixel250 pixel251 pixel252 pixel253 pixel254 pixel255 pixel256 pixel257 pixel258 pixel259 pixel260 pixel261 pixel262 pixel263 pixel264 pixel265 pixel266 pixel267 pixel268 pixel269 pixel270 pixel271 pixel272 pixel273 pixel274 pixel275 pixel276 pixel277 pixel278 pixel279 pixel280 pixel281 pixel282 pixel283 pixel284 pixel285 pixel286 pixel287 pixel288 pixel289 pixel290 pixel291 pixel292 pixel293 pixel294 pixel295 pixel296 pixel297 pixel298 pixel299 pixel300 pixel301 pixel302 pixel303 pixel304 pixel305 pixel306 pixel307 pixel308 pixel309 pixel310 pixel311 pixel312 pixel313 pixel314 pixel315 pixel316 pixel317 pixel318 pixel319 pixel320 pixel321 pixel322 pixel323 pixel324 pixel325 pixel326 pixel327 pixel328 pixel329 pixel330 pixel331 pixel332 pixel333 pixel334 pixel335 pixel336 pixel337 pixel338 pixel339 pixel340 pixel341 pixel342 pixel343 pixel344 pixel345 pixel346 pixel347 pixel348 pixel349 pixel350 pixel351 pixel352 pixel353 pixel354 pixel355 pixel356 pixel357 pixel358 pixel359 pixel360 pixel361 pixel362 pixel363 pixel364 pixel365 pixel366 pixel367 pixel368 pixel369 pixel370 pixel371 pixel372 pixel373 pixel374 pixel375 pixel376 pixel377 pixel378 pixel379 pixel380 pixel381 pixel382 pixel383 pixel384 pixel385 pixel386 pixel387 pixel388 pixel389 pixel390 pixel391 pixel392 pixel393 pixel394 pixel395 pixel396 pixel397 pixel398 pixel399 pixel400 pixel401 pixel402 pixel403 pixel404 pixel405 pixel406 pixel407 pixel408 pixel409 pixel410 pixel411 pixel412 pixel413 pixel414 pixel415 pixel416 pixel417 pixel418 pixel419 pixel420 pixel421 pixel422 pixel423 pixel424 pixel425 pixel426 pixel427 pixel428 pixel429 pixel430 pixel431 pixel432 pixel433 pixel434 pixel435 pixel436 pixel437 pixel438 pixel439 pixel440 pixel441 pixel442 pixel443 pixel444 pixel445 pixel446 pixel447 
pixel448 pixel449 pixel450 pixel451 pixel452 pixel453 pixel454 pixel455 pixel456 pixel457 pixel458 pixel459 pixel460 pixel461 pixel462 pixel463 pixel464 pixel465 pixel466 pixel467 pixel468 pixel469 pixel470 pixel471 pixel472 pixel473 pixel474 pixel475 pixel476 pixel477 pixel478 pixel479 pixel480 pixel481 pixel482 pixel483 pixel484 pixel485 pixel486 pixel487 pixel488 pixel489 pixel490 pixel491 pixel492 pixel493 pixel494 pixel495 pixel496 pixel497 pixel498 pixel499 pixel500 pixel501 pixel502 pixel503 pixel504 pixel505 pixel506 pixel507 pixel508 pixel509 pixel510 pixel511 pixel512 pixel513 pixel514 pixel515 pixel516 pixel517 pixel518 pixel519 pixel520 pixel521 pixel522 pixel523 pixel524 pixel525 pixel526 pixel527 pixel528 pixel529 pixel530 pixel531 pixel532 pixel533 pixel534 pixel535 pixel536 pixel537 pixel538 pixel539 pixel540 pixel541 pixel542 pixel543 pixel544 pixel545 pixel546 pixel547 pixel548 pixel549 pixel550 pixel551 pixel552 pixel553 pixel554 pixel555 pixel556 pixel557 pixel558 pixel559 pixel560 pixel561 pixel562 pixel563 pixel564 pixel565 pixel566 pixel567 pixel568 pixel569 pixel570 pixel571 pixel572 pixel573 pixel574 pixel575 pixel576 pixel577 pixel578 pixel579 pixel580 pixel581 pixel582 pixel583 pixel584 pixel585 pixel586 pixel587 pixel588 pixel589 pixel590 pixel591 pixel592 pixel593 pixel594 pixel595 pixel596 pixel597 pixel598 pixel599 pixel600 pixel601 pixel602 pixel603 pixel604 pixel605 pixel606 pixel607 pixel608 pixel609 pixel610 pixel611 pixel612 pixel613 pixel614 pixel615 pixel616 pixel617 pixel618 pixel619 pixel620 pixel621 pixel622 pixel623 pixel624 pixel625 pixel626 pixel627 pixel628 pixel629 pixel630 pixel631 pixel632 pixel633 pixel634 pixel635 pixel636 pixel637 pixel638 pixel639 pixel640 pixel641 pixel642 pixel643 pixel644 pixel645 pixel646 pixel647 pixel648 pixel649 pixel650 pixel651 pixel652 pixel653 pixel654 pixel655 pixel656 pixel657 pixel658 pixel659 pixel660 pixel661 pixel662 pixel663 pixel664 pixel665 pixel666 pixel667 pixel668 pixel669 
pixel670 pixel671 pixel672 pixel673 pixel674 pixel675 pixel676 pixel677 pixel678 pixel679 pixel680 pixel681 pixel682 pixel683 pixel684 pixel685 pixel686 pixel687 pixel688 pixel689 pixel690 pixel691 pixel692 pixel693 pixel694 pixel695 pixel696 pixel697 pixel698 pixel699 pixel700 pixel701 pixel702 pixel703 pixel704 pixel705 pixel706 pixel707 pixel708 pixel709 pixel710 pixel711 pixel712 pixel713 pixel714 pixel715 pixel716 pixel717 pixel718 pixel719 pixel720 pixel721 pixel722 pixel723 pixel724 pixel725 pixel726 pixel727 pixel728 pixel729 pixel730 pixel731 pixel732 pixel733 pixel734 pixel735 pixel736 pixel737 pixel738 pixel739 pixel740 pixel741 pixel742 pixel743 pixel744 pixel745 pixel746 pixel747 pixel748 pixel749 pixel750 pixel751 pixel752 pixel753 pixel754 pixel755 pixel756 pixel757 pixel758 pixel759 pixel760 pixel761 pixel762 pixel763 pixel764 pixel765 pixel766 pixel767 pixel768 pixel769 pixel770 pixel771 pixel772 pixel773 pixel774 pixel775 pixel776 pixel777 pixel778 pixel779 pixel780 pixel781 pixel782 pixel783\n", + "npartitions=2 \n", + " int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 
int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 
int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64\nnn", + "Dask Name: read-csv, 2 tasks" + ] + }, + "execution_count": 29, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df2" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + 
"
\n", + "

Exercise

\n", + "\n", + "Use the Dask dataframe of MNIST (`df2`) and follow these steps:\n", + " \n", + "1. Add a new column called `sum` to the dataframe, containing the sum of all the pixels in each row\n", + "2. Use `groupby` to find the mean value of `sum` for each label\n", + " \n", + "\n", + "
\n", + " → Hints\n", + "\n", + " * Columns 1 onwards are the pixels. You can access them with `pixels=df2.iloc[:, 1:]`\n", + " * Instead of `df2['sum']=pixels.sum()` try `df2['sum']=pixels.sum(axis=1)`, because we want one sum per row (adding across the pixel columns), not one sum per column\n", + " * If the dask output is confusing, try with df1 first\n", + " * To group by label, use `df2.groupby('label').?`, where you replace the `?` with the aggregation operation\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + " \n", + " → Solution\n", + " \n", + "\n", + " ```python\n", + " # With pandas\n", + " pixels = df1.loc[:, ['pixel' in c for c in df1.columns]]\n", + " df1['sum']=pixels.sum(axis=1)\n", + " result = df1[['label','sum']].groupby('label').mean()\n", + " print(result)\n", + "\n", + " # With dask\n", + " pixels = df2.loc[:, ['pixel' in c for c in df2.columns]]\n", + " df2['sum']=pixels.sum(axis=1)\n", + " task = df2[['label','sum']].groupby('label').mean()\n", + " with ProgressBar():\n", + " result=task.compute() \n", + " print(result)\n", + " ```\n", + "\n", + "
\n", + "\n", + "\n", + "
" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T02:59:56.210856Z", + "start_time": "2020-10-14T02:59:55.313285Z" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "
Dask DataFrame Structure:
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
pixel0pixel1pixel2pixel3pixel4pixel5pixel6pixel7pixel8pixel9pixel10pixel11pixel12pixel13pixel14pixel15pixel16pixel17pixel18pixel19pixel20pixel21pixel22pixel23pixel24pixel25pixel26pixel27pixel28pixel29pixel30pixel31pixel32pixel33pixel34pixel35pixel36pixel37pixel38pixel39pixel40pixel41pixel42pixel43pixel44pixel45pixel46pixel47pixel48pixel49pixel50pixel51pixel52pixel53pixel54pixel55pixel56pixel57pixel58pixel59pixel60pixel61pixel62pixel63pixel64pixel65pixel66pixel67pixel68pixel69pixel70pixel71pixel72pixel73pixel74pixel75pixel76pixel77pixel78pixel79pixel80pixel81pixel82pixel83pixel84pixel85pixel86pixel87pixel88pixel89pixel90pixel91pixel92pixel93pixel94pixel95pixel96pixel97pixel98pixel99pixel100pixel101pixel102pixel103pixel104pixel105pixel106pixel107pixel108pixel109pixel110pixel111pixel112pixel113pixel114pixel115pixel116pixel117pixel118pixel119pixel120pixel121pixel122pixel123pixel124pixel125pixel126pixel127pixel128pixel129pixel130pixel131pixel132pixel133pixel134pixel135pixel136pixel137pixel138pixel139pixel140pixel141pixel142pixel143pixel144pixel145pixel146pixel147pixel148pixel149pixel150pixel151pixel152pixel153pixel154pixel155pixel156pixel157pixel158pixel159pixel160pixel161pixel162pixel163pixel164pixel165pixel166pixel167pixel168pixel169pixel170pixel171pixel172pixel173pixel174pixel175pixel176pixel177pixel178pixel179pixel180pixel181pixel182pixel183pixel184pixel185pixel186pixel187pixel188pixel189pixel190pixel191pixel192pixel193pixel194pixel195pixel196pixel197pixel198pixel199pixel200pixel201pixel202pixel203pixel204pixel205pixel206pixel207pixel208pixel209pixel210pixel211pixel212pixel213pixel214pixel215pixel216pixel217pixel218pixel219pixel220pixel221pixel222pixel223pixel224pixel225pixel226pixel227pixel228pixel229pixel230pixel231pixel232pixel233pixel234pixel235pixel236pixel237pixel238pixel239pixel240pixel241pixel242pixel243pixel244pixel245pixel246pixel247pixel248pixel249pixel250pixel251pixel252pixel253pixel254pixel255pixel256pixel257pixel258pixel259pixel260pixel261pixel262pixel2
63pixel264pixel265pixel266pixel267pixel268pixel269pixel270pixel271pixel272pixel273pixel274pixel275pixel276pixel277pixel278pixel279pixel280pixel281pixel282pixel283pixel284pixel285pixel286pixel287pixel288pixel289pixel290pixel291pixel292pixel293pixel294pixel295pixel296pixel297pixel298pixel299pixel300pixel301pixel302pixel303pixel304pixel305pixel306pixel307pixel308pixel309pixel310pixel311pixel312pixel313pixel314pixel315pixel316pixel317pixel318pixel319pixel320pixel321pixel322pixel323pixel324pixel325pixel326pixel327pixel328pixel329pixel330pixel331pixel332pixel333pixel334pixel335pixel336pixel337pixel338pixel339pixel340pixel341pixel342pixel343pixel344pixel345pixel346pixel347pixel348pixel349pixel350pixel351pixel352pixel353pixel354pixel355pixel356pixel357pixel358pixel359pixel360pixel361pixel362pixel363pixel364pixel365pixel366pixel367pixel368pixel369pixel370pixel371pixel372pixel373pixel374pixel375pixel376pixel377pixel378pixel379pixel380pixel381pixel382pixel383pixel384pixel385pixel386pixel387pixel388pixel389pixel390pixel391pixel392pixel393pixel394pixel395pixel396pixel397pixel398pixel399pixel400pixel401pixel402pixel403pixel404pixel405pixel406pixel407pixel408pixel409pixel410pixel411pixel412pixel413pixel414pixel415pixel416pixel417pixel418pixel419pixel420pixel421pixel422pixel423pixel424pixel425pixel426pixel427pixel428pixel429pixel430pixel431pixel432pixel433pixel434pixel435pixel436pixel437pixel438pixel439pixel440pixel441pixel442pixel443pixel444pixel445pixel446pixel447pixel448pixel449pixel450pixel451pixel452pixel453pixel454pixel455pixel456pixel457pixel458pixel459pixel460pixel461pixel462pixel463pixel464pixel465pixel466pixel467pixel468pixel469pixel470pixel471pixel472pixel473pixel474pixel475pixel476pixel477pixel478pixel479pixel480pixel481pixel482pixel483pixel484pixel485pixel486pixel487pixel488pixel489pixel490pixel491pixel492pixel493pixel494pixel495pixel496pixel497pixel498pixel499pixel500pixel501pixel502pixel503pixel504pixel505pixel506pixel507pixel508pixel509pixel510pixel511pixel512pixel5
13pixel514pixel515pixel516pixel517pixel518pixel519pixel520pixel521pixel522pixel523pixel524pixel525pixel526pixel527pixel528pixel529pixel530pixel531pixel532pixel533pixel534pixel535pixel536pixel537pixel538pixel539pixel540pixel541pixel542pixel543pixel544pixel545pixel546pixel547pixel548pixel549pixel550pixel551pixel552pixel553pixel554pixel555pixel556pixel557pixel558pixel559pixel560pixel561pixel562pixel563pixel564pixel565pixel566pixel567pixel568pixel569pixel570pixel571pixel572pixel573pixel574pixel575pixel576pixel577pixel578pixel579pixel580pixel581pixel582pixel583pixel584pixel585pixel586pixel587pixel588pixel589pixel590pixel591pixel592pixel593pixel594pixel595pixel596pixel597pixel598pixel599pixel600pixel601pixel602pixel603pixel604pixel605pixel606pixel607pixel608pixel609pixel610pixel611pixel612pixel613pixel614pixel615pixel616pixel617pixel618pixel619pixel620pixel621pixel622pixel623pixel624pixel625pixel626pixel627pixel628pixel629pixel630pixel631pixel632pixel633pixel634pixel635pixel636pixel637pixel638pixel639pixel640pixel641pixel642pixel643pixel644pixel645pixel646pixel647pixel648pixel649pixel650pixel651pixel652pixel653pixel654pixel655pixel656pixel657pixel658pixel659pixel660pixel661pixel662pixel663pixel664pixel665pixel666pixel667pixel668pixel669pixel670pixel671pixel672pixel673pixel674pixel675pixel676pixel677pixel678pixel679pixel680pixel681pixel682pixel683pixel684pixel685pixel686pixel687pixel688pixel689pixel690pixel691pixel692pixel693pixel694pixel695pixel696pixel697pixel698pixel699pixel700pixel701pixel702pixel703pixel704pixel705pixel706pixel707pixel708pixel709pixel710pixel711pixel712pixel713pixel714pixel715pixel716pixel717pixel718pixel719pixel720pixel721pixel722pixel723pixel724pixel725pixel726pixel727pixel728pixel729pixel730pixel731pixel732pixel733pixel734pixel735pixel736pixel737pixel738pixel739pixel740pixel741pixel742pixel743pixel744pixel745pixel746pixel747pixel748pixel749pixel750pixel751pixel752pixel753pixel754pixel755pixel756pixel757pixel758pixel759pixel760pixel761pixel762pixel7
63pixel764pixel765pixel766pixel767pixel768pixel769pixel770pixel771pixel772pixel773pixel774pixel775pixel776pixel777pixel778pixel779pixel780pixel781pixel782pixel783
npartitions=2
int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64
int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64int64


\n", + "
\n", + "
Dask Name: try_loc, 61 tasks
" + ], + "text/plain": [ + "Dask DataFrame Structure:\n", + " pixel0 pixel1 pixel2 pixel3 pixel4 pixel5 pixel6 pixel7 pixel8 pixel9 pixel10 pixel11 pixel12 pixel13 pixel14 pixel15 pixel16 pixel17 pixel18 pixel19 pixel20 pixel21 pixel22 pixel23 pixel24 pixel25 pixel26 pixel27 pixel28 pixel29 pixel30 pixel31 pixel32 pixel33 pixel34 pixel35 pixel36 pixel37 pixel38 pixel39 pixel40 pixel41 pixel42 pixel43 pixel44 pixel45 pixel46 pixel47 pixel48 pixel49 pixel50 pixel51 pixel52 pixel53 pixel54 pixel55 pixel56 pixel57 pixel58 pixel59 pixel60 pixel61 pixel62 pixel63 pixel64 pixel65 pixel66 pixel67 pixel68 pixel69 pixel70 pixel71 pixel72 pixel73 pixel74 pixel75 pixel76 pixel77 pixel78 pixel79 pixel80 pixel81 pixel82 pixel83 pixel84 pixel85 pixel86 pixel87 pixel88 pixel89 pixel90 pixel91 pixel92 pixel93 pixel94 pixel95 pixel96 pixel97 pixel98 pixel99 pixel100 pixel101 pixel102 pixel103 pixel104 pixel105 pixel106 pixel107 pixel108 pixel109 pixel110 pixel111 pixel112 pixel113 pixel114 pixel115 pixel116 pixel117 pixel118 pixel119 pixel120 pixel121 pixel122 pixel123 pixel124 pixel125 pixel126 pixel127 pixel128 pixel129 pixel130 pixel131 pixel132 pixel133 pixel134 pixel135 pixel136 pixel137 pixel138 pixel139 pixel140 pixel141 pixel142 pixel143 pixel144 pixel145 pixel146 pixel147 pixel148 pixel149 pixel150 pixel151 pixel152 pixel153 pixel154 pixel155 pixel156 pixel157 pixel158 pixel159 pixel160 pixel161 pixel162 pixel163 pixel164 pixel165 pixel166 pixel167 pixel168 pixel169 pixel170 pixel171 pixel172 pixel173 pixel174 pixel175 pixel176 pixel177 pixel178 pixel179 pixel180 pixel181 pixel182 pixel183 pixel184 pixel185 pixel186 pixel187 pixel188 pixel189 pixel190 pixel191 pixel192 pixel193 pixel194 pixel195 pixel196 pixel197 pixel198 pixel199 pixel200 pixel201 pixel202 pixel203 pixel204 pixel205 pixel206 pixel207 pixel208 pixel209 pixel210 pixel211 pixel212 pixel213 pixel214 pixel215 pixel216 pixel217 pixel218 pixel219 pixel220 pixel221 pixel222 pixel223 pixel224 pixel225 pixel226 
pixel227 pixel228 pixel229 pixel230 pixel231 pixel232 pixel233 pixel234 pixel235 pixel236 pixel237 pixel238 pixel239 pixel240 pixel241 pixel242 pixel243 pixel244 pixel245 pixel246 pixel247 pixel248 pixel249 pixel250 pixel251 pixel252 pixel253 pixel254 pixel255 pixel256 pixel257 pixel258 pixel259 pixel260 pixel261 pixel262 pixel263 pixel264 pixel265 pixel266 pixel267 pixel268 pixel269 pixel270 pixel271 pixel272 pixel273 pixel274 pixel275 pixel276 pixel277 pixel278 pixel279 pixel280 pixel281 pixel282 pixel283 pixel284 pixel285 pixel286 pixel287 pixel288 pixel289 pixel290 pixel291 pixel292 pixel293 pixel294 pixel295 pixel296 pixel297 pixel298 pixel299 pixel300 pixel301 pixel302 pixel303 pixel304 pixel305 pixel306 pixel307 pixel308 pixel309 pixel310 pixel311 pixel312 pixel313 pixel314 pixel315 pixel316 pixel317 pixel318 pixel319 pixel320 pixel321 pixel322 pixel323 pixel324 pixel325 pixel326 pixel327 pixel328 pixel329 pixel330 pixel331 pixel332 pixel333 pixel334 pixel335 pixel336 pixel337 pixel338 pixel339 pixel340 pixel341 pixel342 pixel343 pixel344 pixel345 pixel346 pixel347 pixel348 pixel349 pixel350 pixel351 pixel352 pixel353 pixel354 pixel355 pixel356 pixel357 pixel358 pixel359 pixel360 pixel361 pixel362 pixel363 pixel364 pixel365 pixel366 pixel367 pixel368 pixel369 pixel370 pixel371 pixel372 pixel373 pixel374 pixel375 pixel376 pixel377 pixel378 pixel379 pixel380 pixel381 pixel382 pixel383 pixel384 pixel385 pixel386 pixel387 pixel388 pixel389 pixel390 pixel391 pixel392 pixel393 pixel394 pixel395 pixel396 pixel397 pixel398 pixel399 pixel400 pixel401 pixel402 pixel403 pixel404 pixel405 pixel406 pixel407 pixel408 pixel409 pixel410 pixel411 pixel412 pixel413 pixel414 pixel415 pixel416 pixel417 pixel418 pixel419 pixel420 pixel421 pixel422 pixel423 pixel424 pixel425 pixel426 pixel427 pixel428 pixel429 pixel430 pixel431 pixel432 pixel433 pixel434 pixel435 pixel436 pixel437 pixel438 pixel439 pixel440 pixel441 pixel442 pixel443 pixel444 pixel445 pixel446 pixel447 pixel448 
pixel449 pixel450 pixel451 pixel452 pixel453 pixel454 pixel455 pixel456 pixel457 pixel458 pixel459 pixel460 pixel461 pixel462 pixel463 pixel464 pixel465 pixel466 pixel467 pixel468 pixel469 pixel470 pixel471 pixel472 pixel473 pixel474 pixel475 pixel476 pixel477 pixel478 pixel479 pixel480 pixel481 pixel482 pixel483 pixel484 pixel485 pixel486 pixel487 pixel488 pixel489 pixel490 pixel491 pixel492 pixel493 pixel494 pixel495 pixel496 pixel497 pixel498 pixel499 pixel500 pixel501 pixel502 pixel503 pixel504 pixel505 pixel506 pixel507 pixel508 pixel509 pixel510 pixel511 pixel512 pixel513 pixel514 pixel515 pixel516 pixel517 pixel518 pixel519 pixel520 pixel521 pixel522 pixel523 pixel524 pixel525 pixel526 pixel527 pixel528 pixel529 pixel530 pixel531 pixel532 pixel533 pixel534 pixel535 pixel536 pixel537 pixel538 pixel539 pixel540 pixel541 pixel542 pixel543 pixel544 pixel545 pixel546 pixel547 pixel548 pixel549 pixel550 pixel551 pixel552 pixel553 pixel554 pixel555 pixel556 pixel557 pixel558 pixel559 pixel560 pixel561 pixel562 pixel563 pixel564 pixel565 pixel566 pixel567 pixel568 pixel569 pixel570 pixel571 pixel572 pixel573 pixel574 pixel575 pixel576 pixel577 pixel578 pixel579 pixel580 pixel581 pixel582 pixel583 pixel584 pixel585 pixel586 pixel587 pixel588 pixel589 pixel590 pixel591 pixel592 pixel593 pixel594 pixel595 pixel596 pixel597 pixel598 pixel599 pixel600 pixel601 pixel602 pixel603 pixel604 pixel605 pixel606 pixel607 pixel608 pixel609 pixel610 pixel611 pixel612 pixel613 pixel614 pixel615 pixel616 pixel617 pixel618 pixel619 pixel620 pixel621 pixel622 pixel623 pixel624 pixel625 pixel626 pixel627 pixel628 pixel629 pixel630 pixel631 pixel632 pixel633 pixel634 pixel635 pixel636 pixel637 pixel638 pixel639 pixel640 pixel641 pixel642 pixel643 pixel644 pixel645 pixel646 pixel647 pixel648 pixel649 pixel650 pixel651 pixel652 pixel653 pixel654 pixel655 pixel656 pixel657 pixel658 pixel659 pixel660 pixel661 pixel662 pixel663 pixel664 pixel665 pixel666 pixel667 pixel668 pixel669 pixel670 
pixel671 pixel672 pixel673 pixel674 pixel675 pixel676 pixel677 pixel678 pixel679 pixel680 pixel681 pixel682 pixel683 pixel684 pixel685 pixel686 pixel687 pixel688 pixel689 pixel690 pixel691 pixel692 pixel693 pixel694 pixel695 pixel696 pixel697 pixel698 pixel699 pixel700 pixel701 pixel702 pixel703 pixel704 pixel705 pixel706 pixel707 pixel708 pixel709 pixel710 pixel711 pixel712 pixel713 pixel714 pixel715 pixel716 pixel717 pixel718 pixel719 pixel720 pixel721 pixel722 pixel723 pixel724 pixel725 pixel726 pixel727 pixel728 pixel729 pixel730 pixel731 pixel732 pixel733 pixel734 pixel735 pixel736 pixel737 pixel738 pixel739 pixel740 pixel741 pixel742 pixel743 pixel744 pixel745 pixel746 pixel747 pixel748 pixel749 pixel750 pixel751 pixel752 pixel753 pixel754 pixel755 pixel756 pixel757 pixel758 pixel759 pixel760 pixel761 pixel762 pixel763 pixel764 pixel765 pixel766 pixel767 pixel768 pixel769 pixel770 pixel771 pixel772 pixel773 pixel774 pixel775 pixel776 pixel777 pixel778 pixel779 pixel780 pixel781 pixel782 pixel783\n", + "npartitions=2 \n", + " int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 
int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 
int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64 int64\nnn", + "Dask Name: try_loc, 61 tasks" + ] + }, + "execution_count": 56, + "metadata": {}, + "output_type": "execute_result" + } ], "source": [ - "res" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### 
Exercise\n", + "# With pandas\n", + "# pixels = df1.loc[:, ['pixel' in c for c in df1.columns]]\n", + "pixels = df1.loc[:, 'pixel1':'pixel783']\n", + "pixels\n", + "df1['sum']=pixels.sum(axis=1)\n", + "df1['sum']\n", + "# task = df1[['label','sum']].groupby('label').mean()\n", + "df1[['label','sum']].groupby('label').mean()\n", "\n", - "- Create two Dask random arrays of size 10,000,000-by-100. \n", - "- Find the difference between the two `y = ..`\n", - "- and pass it to `array.linalg.norm` using argument `axis=1`. \n", - "- Calculate the result and create a histogram of it." - ] - }, - { - "cell_type": "code", - "execution_count": 31, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:13:53.285755Z", - "start_time": "2020-10-04T07:13:53.281047Z" - } - }, - "outputs": [], - "source": [ - "from matplotlib.pyplot import hist" + "gg = df1[['label','sum']].groupby('label')\n", + "list(gg)[0]\n", + "# df1.loc[:, 'pixel1':'pixel783'].csum\n", + "# print(result)\n", + "\n", + "# # With dask\n", + "pixels = df2.loc[:, ['pixel' in c for c in df2.columns]]\n", + "pixels\n", + "# df2['sum']=pixels.sum(axis=1)\n", + "# task = df2[['label','sum']].groupby('label').mean()\n", + "# with ProgressBar():\n", + "# result=task.compute() \n", + "# print(result)" ] }, { "cell_type": "markdown", - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:04:25.331001Z", - "start_time": "2020-10-04T07:04:25.308406Z" - } - }, + "metadata": {}, "source": [ - "
\n", - "

Exercise

\n", - "\n", - " Description:\n", - "\n", - "- Create two Dask random arrays of size 10,000,000-by-100. \n", - "- Find the difference between the two `y = ..`\n", - "- and pass it to `array.linalg.norm` using argument `axis=1`. \n", - "- Calculate the result and create a histogram of it.\n", - " \n", - "\n", - "
\n", - " → Hints\n", - " \n", - " Replace the question marks `?`\n", - "\n", - "```python\n", - "a = array.random.normal(size=(10000000, 100), chunks=200000)\n", - "b = array.random.normal(size=(10000000, 100), chunks=200000)\n", - "r = array.linalg.norm(?, axis=1)\n", - "r.?\n", - "```\n", - "\n", - "
\n", - "\n", - "
\n", - "
\n", - "
\n", - " \n", - " → Solution\n", - " \n", + "## When to use Dask DataFrame?\n", "\n", - " ```python\n", - " x1 = array.random.random(size=(10000000,100))\n", - " x2 = array.random.random(size=(10000000,100))\n", - " y = x2-x1\n", - " d = array.linalg.norm(y,axis=1)\n", - " with ProgressBar():\n", - " result = d.compute()\n", - " hist(result,bins=100);\n", - " ```\n", + "Let's visit [the dask page](https://docs.dask.org/en/latest/dataframe.html#common-uses-and-anti-uses) to see when we should use it.\n", "\n", - "
\n", + "It is harder to use, so only use it if your dataset is larger than memory.\n", "\n", - "
" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Delayed\n", - "Dask delayed is a method for parallelising code where you can't write your code directly as dataframe or array operation. `Dask.delayed` is an easy-to-use tool to quickly parallelise these tasks." + "In fact, also consider:\n", + "- a database (if you have lots of structured queries)\n", + "- https://downloadmoreram.com/ ;p\n", + "- dask array" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Consider the following functions. The first one takes an input, waits for one second and returns the value. The second function takes two inputs, waits for one second and returns the sum. We are using these functions to represent tasks that are time consuming." + "## Dask Array\n", + "Dask is not just used to replace pandas. There are also multiple numpy functions which can be replaced by Dask. Dask array is the Dask equivalent of a numpy array. By using it, we can perform the computations in parallel and get the results faster." 
] }, { "cell_type": "code", - "execution_count": 32, + "execution_count": 57, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:53.300877Z", - "start_time": "2020-10-04T07:13:53.289192Z" + "end_time": "2020-10-14T03:03:00.931400Z", + "start_time": "2020-10-14T03:03:00.929055Z" } }, "outputs": [], "source": [ - "from time import sleep\n", - "\n", - "\n", - "def task1(x):\n", - " sleep(1)\n", - " return x\n", - "\n", - "\n", - "def task2(x, y):\n", - " sleep(1)\n", - " return x + y" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Now, if we pass two values separately into the first function and then pass the results into the second function, we will have the following code:" + "from dask import array" ] }, { "cell_type": "code", - "execution_count": 33, + "execution_count": 58, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:56.315870Z", - "start_time": "2020-10-04T07:13:53.304926Z" + "end_time": "2020-10-14T03:03:01.407137Z", + "start_time": "2020-10-14T03:03:01.400443Z" } }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "CPU times: user 4.81 ms, sys: 74 µs, total: 4.89 ms\n", - "Wall time: 3 s\n" - ] - } - ], - "source": [ - "%%time\n", - "x1 = task1(1)\n", - "x2 = task1(2)\n", - "y = task2(x1,x2)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, + "outputs": [], "source": [ - "Since each of these functions are taking one second; therefore, the entire block takes three seconds. But the calculation for `x1` is totally independent of the calculation for `x2`. If we were able to do these operation simultaneously we could save time. This is where `Dask.delayed` comes into play. We need to convert the functions into `delayed` functions so Dask can handle parallelisation." 
+ "big_array = array.random.normal(size=(10000000, 100), chunks=200000)" ] }, { "cell_type": "code", - "execution_count": 34, + "execution_count": 59, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:56.325303Z", - "start_time": "2020-10-04T07:13:56.319479Z" + "end_time": "2020-10-14T03:03:01.852375Z", + "start_time": "2020-10-14T03:03:01.846761Z" } }, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Array Chunk
Bytes 8.00 GB 160.00 MB
Shape (10000000, 100) (200000, 100)
Count 50 Tasks 50 Chunks
Type float64 numpy.ndarray
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + "\n", + " \n", + " 100\n", + " 10000000\n", + "\n", + "
" + ], + "text/plain": [ + "dask.array" + ] + }, + "execution_count": 59, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "task1_delayed = dask.delayed(task1)\n", - "task2_delayed = dask.delayed(task2)" + "big_array" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "And now instead of the original function we use the delayed functions:" + "This data takes 8 GB if we wanted to store it in RAM. But Dask only generates the numbers in chunks when it needs them. So at each steps it has to deal with a chunk which is ~160 MB in this case." ] }, { "cell_type": "code", - "execution_count": 35, + "execution_count": 60, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:56.338070Z", - "start_time": "2020-10-04T07:13:56.329559Z" + "end_time": "2020-10-14T03:04:16.237275Z", + "start_time": "2020-10-14T03:04:06.749275Z" } }, "outputs": [ @@ -1500,96 +9029,113 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 524 µs, sys: 0 ns, total: 524 µs\n", - "Wall time: 465 µs\n" + "[########################################] | 100% Completed | 9.5s\n" ] } ], "source": [ - "%%time\n", - "x1 = task1_delayed(1)\n", - "x2 = task1_delayed(2)\n", - "y = task2_delayed(x1,x2)" + "task = (big_array * big_array).mean(axis=1)\n", + "with ProgressBar():\n", + " res = task.compute()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can set the chunk size:" ] }, { "cell_type": "code", - "execution_count": 36, + "execution_count": 61, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:13:58.355308Z", - "start_time": "2020-10-04T07:13:56.341660Z" + "end_time": "2020-10-14T03:04:50.034869Z", + "start_time": "2020-10-14T03:04:50.028940Z" } }, "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "CPU times: user 5.72 ms, sys: 0 ns, total: 5.72 ms\n", - "Wall time: 2 s\n" - ] - }, { "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Array Chunk
Bytes 8.00 GB 419.43 MB
Shape (10000000, 100) (524288, 100)
Count 20 Tasks 20 Chunks
Type float64 numpy.ndarray
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + "\n", + " \n", + " 100\n", + " 10000000\n", + "\n", + "
" + ], "text/plain": [ - "3" + "dask.array" ] }, - "execution_count": 36, + "execution_count": 61, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "%%time\n", - "y.compute()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "And we saved one second! `x1` and `x2` where calculated in parallel, and then `y` was calculated using `x1` and `x2`." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "We can directly create delayed functions using `dask.delayed` decorator." - ] - }, - { - "cell_type": "code", - "execution_count": 37, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:13:58.365973Z", - "start_time": "2020-10-04T07:13:58.358782Z" - } - }, - "outputs": [], - "source": [ - "@dask.delayed\n", - "def task1(x):\n", - " sleep(1)\n", - " return x\n", - "\n", - "\n", - "@dask.delayed\n", - "def task2(x, y):\n", - " sleep(1)\n", - " return x + y" + "big_array = array.random.normal(size=(10000000, 100), chunks=(2 ** 19, 100))\n", + "big_array" ] }, { "cell_type": "code", - "execution_count": 38, + "execution_count": 62, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:00.383619Z", - "start_time": "2020-10-04T07:13:58.369716Z" + "end_time": "2020-10-14T03:05:01.836720Z", + "start_time": "2020-10-14T03:04:51.480886Z" } }, "outputs": [ @@ -1597,239 +9143,294 @@ "name": "stdout", "output_type": "stream", "text": [ - "CPU times: user 1.85 ms, sys: 3.8 ms, total: 5.65 ms\n", - "Wall time: 2 s\n" + "[########################################] | 100% Completed | 10.3s\n" ] - }, - { - "data": { - "text/plain": [ - "3" - ] - }, - "execution_count": 38, - "metadata": {}, - "output_type": "execute_result" } ], "source": [ - "%%time\n", - "x1 = task1(1)\n", - "x2 = task1(2)\n", - "y = task2(x1,x2)\n", - "y.compute()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Introduction to Numba" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - 
"## What is Numba?\n", - "\n", - "Numba is a **just-in-time**, **type-specializing**, **function compiler** for accelerating **numerically-focused** Python. That's a long list, so let's break down those terms:\n", - "\n", - " * **function compiler**: Numba compiles Python functions, not entire applications, and not parts of functions. Numba does not replace your Python interpreter, but is just another Python module that can turn a function into a (usually) faster function. \n", - " * **type-specializing**: Numba speeds up your function by generating a specialized implementation for the specific data types you are using. Python functions are designed to operate on generic data types, which makes them very flexible, but also very slow. In practice, you only will call a function with a small number of argument types, so Numba will generate a fast implementation for each set of types.\n", - " * **just-in-time**: Numba translates functions when they are first called. This ensures the compiler knows what argument types you will be using. This also allows Numba to be used interactively in a Jupyter notebook just as easily as a traditional application\n", - " * **numerically-focused**: Currently, Numba is focused on numerical data types, like `int`, `float`, and `complex`. There is very limited string processing support, and many string use cases are not going to work well on the GPU. To get best results with Numba, you will likely be using NumPy arrays.\n" + "task = (big_array * big_array).mean(axis=1)\n", + "with ProgressBar():\n", + " res = task.compute()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "### First Steps\n", - "\n", - "Let's write our first Numba function and compile it for the **CPU**. The Numba compiler is typically enabled by applying a *decorator* to a Python function. Decorators are functions that transform Python functions. 
Here we will use the CPU compilation decorator:" + "We can also apply most of common numpy functions to the array." ] }, { "cell_type": "code", - "execution_count": 39, + "execution_count": 63, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:01.058402Z", - "start_time": "2020-10-04T07:14:00.387277Z" + "end_time": "2020-10-14T03:05:16.433299Z", + "start_time": "2020-10-14T03:05:01.838300Z" } }, - "outputs": [], - "source": [ - "from numba import jit\n", - "import math\n", - "\n", - "\n", - "@jit\n", - "def hypot(x, y):\n", - " # Implementation from https://en.wikipedia.org/wiki/Hypot\n", - " x = abs(x)\n", - " y = abs(y)\n", - " t = min(x, y)\n", - " x = max(x, y)\n", - " t = t / x\n", - " return x * math.sqrt(1 + t * t)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[########################################] | 100% Completed | 14.6s\n" + ] + } + ], "source": [ - "The above code is equivalent to writing:\n", - "``` python\n", - "def hypot(x, y):\n", - " x = abs(x);\n", - " y = abs(y);\n", - " t = min(x, y);\n", - " x = max(x, y);\n", - " t = t / x;\n", - " return x * math.sqrt(1+t*t)\n", - " \n", - "hypot = jit(hypot)\n", - "```\n", - "This means that the Numba compiler is just a function you can call whenever you want!\n", - "\n", - "Let's try out our hypotenuse calculation:" + "task = np.sin(big_array).mean(axis=0)\n", + "with ProgressBar():\n", + " res = task.compute()" ] }, { "cell_type": "code", - "execution_count": 40, + "execution_count": 64, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:01.282029Z", - "start_time": "2020-10-04T07:14:01.061236Z" + "end_time": "2020-10-14T03:05:16.439009Z", + "start_time": "2020-10-14T03:05:16.435073Z" } }, "outputs": [ { "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "
\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Array Chunk
Bytes 800 B 800 B
Shape (100,) (100,)
Count 68 Tasks 1 Chunks
Type float64 numpy.ndarray
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + " \n", + "\n", + " \n", + " \n", + "\n", + " \n", + " 100\n", + " 1\n", + "\n", + "
" + ], "text/plain": [ - "5.0" + "dask.array" ] }, - "execution_count": 40, + "execution_count": 64, "metadata": {}, "output_type": "execute_result" - } - ], - "source": [ - "hypot(3.0, 4.0)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, + } + ], "source": [ - "The first time we call `hypot`, the compiler is triggered and compiles a machine code implementation for float inputs. Numba also saves the original Python implementation of the function in the `.py_func` attribute, so we can call the original Python code to make sure we get the same answer:" + "task" ] }, { "cell_type": "code", - "execution_count": 41, + "execution_count": 65, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:01.289853Z", - "start_time": "2020-10-04T07:14:01.284540Z" + "end_time": "2020-10-14T03:05:16.506778Z", + "start_time": "2020-10-14T03:05:16.440443Z" } }, "outputs": [ { "data": { "text/plain": [ - "5.0" + "array([-4.96623569e-05, -9.21618151e-05, 1.77109021e-04, 2.67433735e-04,\n", + " -4.54797760e-05, 2.92740013e-04, 1.02261515e-04, -2.70215806e-04,\n", + " 5.37307664e-04, 2.86031036e-04, -6.97538808e-06, -3.66262279e-05,\n", + " 6.74122747e-05, 1.83273347e-04, 2.11252086e-04, 1.64897837e-04,\n", + " 3.59514362e-05, 1.71063759e-04, -9.70854531e-05, -1.43783037e-04,\n", + " -2.34059994e-04, 1.52175767e-04, -1.31447779e-04, 3.49086909e-04,\n", + " 4.92961515e-05, -6.34444433e-04, -5.88597059e-05, 2.33904797e-05,\n", + " 1.43739722e-04, 2.98193817e-04, -3.17477335e-05, -2.08925932e-04,\n", + " 2.05396399e-04, 6.85760116e-05, 1.15092378e-04, 1.36169168e-05,\n", + " -3.61674345e-04, 2.09824264e-04, -1.25670866e-04, 2.50631214e-04,\n", + " 4.12638901e-06, -3.03833410e-04, -6.33738351e-05, -1.26853903e-04,\n", + " 1.51523004e-04, -2.89482462e-04, -1.38021839e-04, -9.12122807e-05,\n", + " -1.00218247e-04, -4.24066366e-05, 2.81373079e-04, -1.40732558e-04,\n", + " 3.44148003e-04, 4.80461779e-04, 1.59566155e-04, -2.33837880e-04,\n", + " 1.94673201e-04, -1.12906923e-04, 
1.65474798e-04, 3.24221883e-04,\n", + " -1.06062398e-04, 1.97985690e-04, -2.05774209e-04, 3.99499162e-05,\n", + " -6.56359293e-04, 1.74988815e-04, -1.26379504e-04, -1.44962937e-04,\n", + " -6.18747968e-05, 3.76777761e-04, -1.30070472e-05, 1.80178223e-04,\n", + " -1.27134975e-04, -6.65599327e-05, 7.29711967e-05, -1.86057964e-04,\n", + " -2.11766175e-04, 4.26616018e-05, 3.74094549e-04, -1.60232094e-05,\n", + " 7.24228099e-05, 2.65367915e-06, 8.58840574e-06, -1.23935576e-04,\n", + " -9.25305321e-05, -2.75633942e-04, 5.31312702e-05, 1.16043460e-04,\n", + " -4.12244514e-04, -1.11056734e-04, -7.11785755e-05, 1.73886249e-05,\n", + " -8.71786971e-05, 3.79871916e-04, 5.61180778e-05, -1.19167936e-04,\n", + " -3.42306665e-04, -1.49317602e-04, -3.93023952e-05, 6.51016327e-05])" ] }, - "execution_count": 41, + "execution_count": 65, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "hypot.py_func(3.0, 4.0)" + "res" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "### Benchmarking\n", + "### Exercise\n", "\n", - "An important part of using Numba is measuring the performance of your new code. Let's see if we actually sped anything up. The easiest way to do this in the Jupyter notebook is to use the `%timeit` magic function. Let's first measure the speed of the original Python:" + "- Create two Dask random arrays of size 10,000,000-by-100. \n", + "- Find the difference between the two `y = ..`\n", + "- and pass it to `array.linalg.norm` using argument `axis=1`. \n", + "- Calculate the result and create a histogram of it." ] }, { "cell_type": "code", - "execution_count": 42, + "execution_count": 31, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:10.897755Z", - "start_time": "2020-10-04T07:14:01.292519Z" + "end_time": "2020-10-04T07:13:53.285755Z", + "start_time": "2020-10-04T07:13:53.281047Z" } }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "1.18 µs ± 33.4 ns per loop (mean ± std. dev. 
of 7 runs, 1000000 loops each)\n" - ] + "outputs": [], + "source": [ + "from matplotlib.pyplot import hist" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-04T07:04:25.331001Z", + "start_time": "2020-10-04T07:04:25.308406Z" } - ], + }, "source": [ - "%timeit hypot.py_func(3.0, 4.0)" + "
\n", + "

Exercise

\n", + "\n", + " Description:\n", + "\n", + "- Create two Dask random arrays of size 10,000,000-by-100. \n", + "- Find the difference between the two `y = ..`\n", + "- and pass it to `array.linalg.norm` using argument `axis=1`. \n", + "- Calculate the result and create a histogram of it.\n", + " \n", + "\n", + "
\n", + " → Hints\n", + " \n", + " Replace the question marks `?`\n", + "\n", + "```python\n", + "a = array.random.normal(size=(10000000, 100), chunks=200000)\n", + "b = array.random.normal(size=(10000000, 100), chunks=200000)\n", + "r = array.linalg.norm(?, axis=1)\n", + "r.?\n", + "```\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "
\n", + " \n", + " → Solution\n", + " \n", + "\n", + " ```python\n", + " x1 = array.random.random(size=(10000000,100))\n", + " x2 = array.random.random(size=(10000000,100))\n", + " y = x2-x1\n", + " d = array.linalg.norm(y,axis=1)\n", + " with ProgressBar():\n", + " result = d.compute()\n", + " plt.hist(result,bins=100);\n", + " ```\n", + "\n", + "
\n", + "\n", + "
" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "The `%timeit` magic runs the statement many times to get an accurate estimate of the run time." + "## Delayed\n", + "Dask delayed is a method for parallelising code where you can't write your code directly as dataframe or array operation. `Dask.delayed` is an easy-to-use tool to quickly parallelise these tasks." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Consider the following functions. The first one takes an input, waits for one second and returns the value. The second function takes two inputs, waits for one second and returns the sum. We are using these functions to represent tasks that are time consuming." ] }, { "cell_type": "code", - "execution_count": 43, + "execution_count": 69, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:13.554235Z", - "start_time": "2020-10-04T07:14:10.900691Z" + "end_time": "2020-10-14T03:15:10.324957Z", + "start_time": "2020-10-14T03:15:10.321859Z" } }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "322 ns ± 8.11 ns per loop (mean ± std. dev. of 7 runs, 1000000 loops each)\n" - ] - } - ], + "outputs": [], "source": [ - "%timeit hypot(3.0, 4.0)" + "from time import sleep\n", + "\n", + "\n", + "def task1(x):\n", + " sleep(1)\n", + " return x\n", + "\n", + "\n", + "def task2(x, y):\n", + " sleep(1)\n", + " return x + y" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Numba did a pretty good job with this function. 
It's 3x faster than the pure Python version.\n", - "\n", - "Of course, the `hypot` function is already present in the Python module:" + "Now, if we pass two values separately into the first function and then pass the results into the second function, we will have the following code:" ] }, { "cell_type": "code", - "execution_count": 44, + "execution_count": 70, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:15.594561Z", - "start_time": "2020-10-04T07:14:13.556497Z" + "end_time": "2020-10-14T03:15:14.035901Z", + "start_time": "2020-10-14T03:15:11.029409Z" } }, "outputs": [ @@ -1837,43 +9438,54 @@ "name": "stdout", "output_type": "stream", "text": [ - "247 ns ± 1.24 ns per loop (mean ± std. dev. of 7 runs, 1000000 loops each)\n" + "CPU times: user 0 ns, sys: 2.15 ms, total: 2.15 ms\n", + "Wall time: 3 s\n" ] } ], "source": [ - "%timeit math.hypot(3.0, 4.0)" + "%%time\n", + "x1 = task1(1)\n", + "x2 = task1(2)\n", + "y = task2(x1,x2)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Python's built-in is even faster than Numba! This is because Numba does introduce some overhead to each function call that is larger than the function call overhead of Python itself. Extremely fast functions (like the above one) will be hurt by this.\n", - "\n", - "(However, if you call one Numba function from another one, there is very little function overhead, sometimes even zero if the compiler inlines the function into the other one.)" + "Since each of these functions takes one second, the entire block takes three seconds. But the calculation for `x1` is totally independent of the calculation for `x2`. If we were able to do these operations simultaneously, we could save time. This is where `Dask.delayed` comes into play. We need to convert the functions into `delayed` functions so Dask can handle parallelisation." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 71, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:15:30.151401Z", + "start_time": "2020-10-14T03:15:30.148783Z" + } + }, + "outputs": [], + "source": [ + "task1_delayed = dask.delayed(task1)\n", + "task2_delayed = dask.delayed(task2)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "### How does Numba work?\n", - "\n", - "The first time we called our Numba-wrapped `hypot` function, the following process was initiated:\n", - "\n", - "![Numba Flowchart](img/numba_flowchart.png \"The compilation process\")\n", - "\n", - "We can see the result of type inference by using the `.inspect_types()` method, which prints an annotated version of the source code:" + "And now instead of the original function we use the delayed functions:" ] }, { "cell_type": "code", - "execution_count": 45, + "execution_count": 72, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:15.605026Z", - "start_time": "2020-10-04T07:14:15.598417Z" + "end_time": "2020-10-14T03:16:02.623513Z", + "start_time": "2020-10-14T03:16:02.619917Z" } }, "outputs": [ @@ -1881,407 +9493,739 @@ "name": "stdout", "output_type": "stream", "text": [ - "hypot (float64, float64)\n", - "--------------------------------------------------------------------------------\n", - "# File: \n", - "# --- LINE 5 --- \n", - "# label 0\n", - "\n", - "@jit\n", - "\n", - "# --- LINE 6 --- \n", - "\n", - "def hypot(x, y):\n", - "\n", - " # --- LINE 7 --- \n", - "\n", - " # Implementation from https://en.wikipedia.org/wiki/Hypot\n", - "\n", - " # --- LINE 8 --- \n", - " # x = arg(0, name=x) :: float64\n", - " # y = arg(1, name=y) :: float64\n", - " # $0.1 = global(abs: ) :: Function()\n", - " # $0.3 = call $0.1(x, func=$0.1, args=[Var(x, (8))], kws=(), vararg=None) :: (float64,) -> float64\n", - " # del x\n", - " # del $0.1\n", - " # x.1 = $0.3 :: float64\n", - " # del $0.3\n", - "\n", - " x = abs(x)\n", - "\n", - " # --- LINE 9 --- \n", - " 
# $0.4 = global(abs: ) :: Function()\n", - " # $0.6 = call $0.4(y, func=$0.4, args=[Var(y, (8))], kws=(), vararg=None) :: (float64,) -> float64\n", - " # del y\n", - " # del $0.4\n", - " # y.1 = $0.6 :: float64\n", - " # del $0.6\n", - "\n", - " y = abs(y)\n", - "\n", - " # --- LINE 10 --- \n", - " # $0.7 = global(min: ) :: Function()\n", - " # $0.10 = call $0.7(x.1, y.1, func=$0.7, args=[Var(x.1, (8)), Var(y.1, (9))], kws=(), vararg=None) :: (float64, float64) -> float64\n", - " # del $0.7\n", - " # t = $0.10 :: float64\n", - " # del $0.10\n", - "\n", - " t = min(x, y)\n", - "\n", - " # --- LINE 11 --- \n", - " # $0.11 = global(max: ) :: Function()\n", - " # $0.14 = call $0.11(x.1, y.1, func=$0.11, args=[Var(x.1, (8)), Var(y.1, (9))], kws=(), vararg=None) :: (float64, float64) -> float64\n", - " # del y.1\n", - " # del x.1\n", - " # del $0.11\n", - " # x.2 = $0.14 :: float64\n", - " # del $0.14\n", - "\n", - " x = max(x, y)\n", - "\n", - " # --- LINE 12 --- \n", - " # $0.17 = t / x.2 :: float64\n", - " # del t\n", - " # t.1 = $0.17 :: float64\n", - " # del $0.17\n", - "\n", - " t = t / x\n", - "\n", - " # --- LINE 13 --- \n", - " # $0.19 = global(math: ) :: Module()\n", - " # $0.20 = getattr(value=$0.19, attr=sqrt) :: Function()\n", - " # del $0.19\n", - " # $const0.21 = const(int, 1) :: Literal[int](1)\n", - " # $0.24 = t.1 * t.1 :: float64\n", - " # del t.1\n", - " # $0.25 = $const0.21 + $0.24 :: float64\n", - " # del $const0.21\n", - " # del $0.24\n", - " # $0.26 = call $0.20($0.25, func=$0.20, args=[Var($0.25, (13))], kws=(), vararg=None) :: (float64,) -> float64\n", - " # del $0.25\n", - " # del $0.20\n", - " # $0.27 = x.2 * $0.26 :: float64\n", - " # del x.2\n", - " # del $0.26\n", - " # $0.28 = cast(value=$0.27) :: float64\n", - " # del $0.27\n", - " # return $0.28\n", - "\n", - " return x * math.sqrt(1 + t * t)\n", - "\n", - "\n", - "================================================================================\n" + "CPU times: user 522 µs, sys: 75 µs, 
total: 597 µs\n", + "Wall time: 439 µs\n" ] } ], "source": [ - "hypot.inspect_types()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Note that Numba's type names tend to mirror the NumPy type names, so a Python `float` is a `float64` (also called \"double precision\" in other languages). Taking a look at the data types can sometimes be important in GPU code because the performance of `float32` and `float64` computations will be very different on CUDA devices. An accidental upcast can dramatically slow down a function." - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### When Things Go Wrong\n", - "\n", - "Numba cannot compile all Python code. Some functions don't have a Numba-translation, and some kinds of Python types can't be efficiently compiled at all (yet). For example, Numba does not support `FrozenSet` (as of this tutorial):" + "%%time\n", + "x1 = task1_delayed(1)\n", + "x2 = task1_delayed(2)\n", + "y = task2_delayed(x1,x2)" ] }, { "cell_type": "code", - "execution_count": 46, + "execution_count": 73, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:15.680101Z", - "start_time": "2020-10-04T07:14:15.607250Z" - }, - "scrolled": true + "end_time": "2020-10-14T03:16:05.539712Z", + "start_time": "2020-10-14T03:16:03.532253Z" + } }, "outputs": [ { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - ":1: NumbaWarning: \u001b[1m\n", - "Compilation is falling back to object mode WITH looplifting enabled because Function \"cannot_compile\" failed type inference due to: \u001b[1m\u001b[1mnon-precise type pyobject\u001b[0m\n", - "\u001b[0m\u001b[1m[1] During: typing of argument at (3)\u001b[0m\n", - "\u001b[1m\n", - "File \"\", line 3:\u001b[0m\n", - "\u001b[1mdef cannot_compile(x):\n", - "\u001b[1m return \"a\" in x\n", - "\u001b[0m \u001b[1m^\u001b[0m\u001b[0m\n", - "\u001b[0m\n", - " @jit\n", - 
"/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/numba/object_mode_passes.py:178: NumbaWarning: \u001b[1mFunction \"cannot_compile\" was compiled in object mode without forceobj=True.\n", - "\u001b[1m\n", - "File \"\", line 2:\u001b[0m\n", - "\u001b[1m@jit\n", - "\u001b[1mdef cannot_compile(x):\n", - "\u001b[0m\u001b[1m^\u001b[0m\u001b[0m\n", - "\u001b[0m\n", - " state.func_ir.loc))\n", - "/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/numba/object_mode_passes.py:187: NumbaDeprecationWarning: \u001b[1m\n", - "Fall-back from the nopython compilation path to the object mode compilation path has been detected, this is deprecated behaviour.\n", - "\n", - "For more information visit http://numba.pydata.org/numba-doc/latest/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit\n", - "\u001b[1m\n", - "File \"\", line 2:\u001b[0m\n", - "\u001b[1m@jit\n", - "\u001b[1mdef cannot_compile(x):\n", - "\u001b[0m\u001b[1m^\u001b[0m\u001b[0m\n", - "\u001b[0m\n", - " warnings.warn(errors.NumbaDeprecationWarning(msg, state.func_ir.loc))\n" + "CPU times: user 2.72 ms, sys: 394 µs, total: 3.11 ms\n", + "Wall time: 2 s\n" ] }, { "data": { "text/plain": [ - "True" + "3" ] }, - "execution_count": 46, + "execution_count": 73, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "@jit\n", - "def cannot_compile(x):\n", - " return \"a\" in x\n", - "\n", - "\n", - "cannot_compile(frozenset((\"a\", \"b\", \"c\")))" + "%%time\n", + "y.compute()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Wait, what happened?? By default, Numba will fall back to a mode, called \"object mode,\" which does not do type-specialization. Object mode exists to enable other Numba functionality, but in many cases, you want Numba to tell you if type inference fails. You can force \"nopython mode\" (the other compilation mode) by passing arguments to the decorator:" + "And we saved one second! 
`x1` and `x2` were calculated in parallel, and then `y` was calculated using `x1` and `x2`." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can directly create delayed functions using the `dask.delayed` decorator." + ] + }, + { + "cell_type": "code", + "execution_count": 74, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:19:36.667741Z", + "start_time": "2020-10-14T03:19:36.664494Z" + } + }, + "outputs": [], + "source": [ + "@dask.delayed\n", + "def task1(x):\n", + " sleep(1)\n", + " return x\n", + "\n", + "\n", + "@dask.delayed\n", + "def task2(x, y):\n", + " sleep(1)\n", + " return x + y" ] }, { "cell_type": "code", - "execution_count": 47, + "execution_count": 75, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:15.702891Z", - "start_time": "2020-10-04T07:14:15.683207Z" - }, - "scrolled": true + "end_time": "2020-10-14T03:19:44.870446Z", + "start_time": "2020-10-14T03:19:42.862419Z" + } }, "outputs": [ { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - "ERROR:root:Failed in nopython mode pipeline (step: nopython frontend)\n", - "\u001b[1m\u001b[1mnon-precise type pyobject\u001b[0m\n", - "\u001b[0m\u001b[1m[1] During: typing of argument at (3)\u001b[0m\n", - "\u001b[1m\n", - "File \"\", line 3:\u001b[0m\n", - "\u001b[1mdef cannot_compile(x):\n", - "\u001b[1m return \"a\" in x\n", - "\u001b[0m \u001b[1m^\u001b[0m\u001b[0m\n", - "\n", - "This error may have been caused by the following argument(s):\n", - "- argument 0: \u001b[1mcannot determine Numba type of \u001b[0m\n", - "\n", - "This is not usually a problem with Numba itself but instead often caused by\n", - "the use of unsupported features or an issue in resolving types.\n", - "\n", - "To see Python/NumPy features supported by the latest release of Numba visit:\n", - "http://numba.pydata.org/numba-doc/latest/reference/pysupported.html\n", - "and\n", - 
"http://numba.pydata.org/numba-doc/latest/reference/numpysupported.html\n", - "\n", - "For more information about typing errors and how to debug them visit:\n", - "http://numba.pydata.org/numba-doc/latest/user/troubleshoot.html#my-code-doesn-t-compile\n", - "\n", - "If you think your code should work with Numba, please report the error message\n", - "and traceback, along with a minimal reproducer at:\n", - "https://github.com/numba/numba/issues/new\n", - "Traceback (most recent call last):\n", - " File \"\", line 6, in \n", - " cannot_compile(frozenset((\"a\", \"b\", \"c\")))\n", - " File \"/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/numba/dispatcher.py\", line 401, in _compile_for_args\n", - " error_rewrite(e, 'typing')\n", - " File \"/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/numba/dispatcher.py\", line 344, in error_rewrite\n", - " reraise(type(e), e, None)\n", - " File \"/home/wassname/.pyenv/versions/jup3.7.3/lib/python3.7/site-packages/numba/six.py\", line 668, in reraise\n", - " raise value.with_traceback(tb)\n", - "numba.errors.TypingError: Failed in nopython mode pipeline (step: nopython frontend)\n", - "\u001b[1m\u001b[1mnon-precise type pyobject\u001b[0m\n", - "\u001b[0m\u001b[1m[1] During: typing of argument at (3)\u001b[0m\n", - "\u001b[1m\n", - "File \"\", line 3:\u001b[0m\n", - "\u001b[1mdef cannot_compile(x):\n", - "\u001b[1m return \"a\" in x\n", - "\u001b[0m \u001b[1m^\u001b[0m\u001b[0m\n", - "\n", - "This error may have been caused by the following argument(s):\n", - "- argument 0: \u001b[1mcannot determine Numba type of \u001b[0m\n", - "\n", - "This is not usually a problem with Numba itself but instead often caused by\n", - "the use of unsupported features or an issue in resolving types.\n", - "\n", - "To see Python/NumPy features supported by the latest release of Numba visit:\n", - "http://numba.pydata.org/numba-doc/latest/reference/pysupported.html\n", - "and\n", - 
"http://numba.pydata.org/numba-doc/latest/reference/numpysupported.html\n", - "\n", - "For more information about typing errors and how to debug them visit:\n", - "http://numba.pydata.org/numba-doc/latest/user/troubleshoot.html#my-code-doesn-t-compile\n", - "\n", - "If you think your code should work with Numba, please report the error message\n", - "and traceback, along with a minimal reproducer at:\n", - "https://github.com/numba/numba/issues/new\n", - "\n" + "CPU times: user 3.28 ms, sys: 475 µs, total: 3.75 ms\n", + "Wall time: 2 s\n" ] + }, + { + "data": { + "text/plain": [ + "3" + ] + }, + "execution_count": 75, + "metadata": {}, + "output_type": "execute_result" } ], "source": [ - "@jit(nopython=True)\n", - "def cannot_compile(x):\n", - " return \"a\" in x\n", - "\n", - "try:\n", - " cannot_compile(frozenset((\"a\", \"b\", \"c\")))\n", - "except Exception as e:\n", - " logging.exception(e)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "Now we get an exception when Numba tries to compile the function, with an error that says:\n", - "```\n", - "- argument 0: cannot determine Numba type of \n", - "```\n", - "which is the underlying problem. Numba doesn't know about frozenset. There are classes that we use regularly in our code but they might not be defined in Numba. An example of a common class that you cannot use in Numba is pandas data frames.
Now the question is: what does Numba support? Some of the types/classes that are supported by Numba are listed below:\n", - "* Numbers (integers, floats, etc)\n", - "* Numpy arrays\n", - "* Strings\n", - "* Lists and tuples (note that a list/tuple of numbers or strings is supported but a list of lists is not)" + "%%time\n", + "x1 = task1(1)\n", + "x2 = task1(2)\n", + "y = task2(x1,x2)\n", + "y.compute()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "So, if we want the last example to be compiled successfully by Numba jit, we need to use a tuple or a list." + "# Xarray\n", + "\n", + "Xarray is pandas for N-dimensional data. It also has a [dask backend](http://xarray.pydata.org/en/stable/dask.html)" ] }, { "cell_type": "code", - "execution_count": 48, + "execution_count": 77, "metadata": { "ExecuteTime": { - "end_time": "2020-10-04T07:14:16.550823Z", - "start_time": "2020-10-04T07:14:15.708748Z" + "end_time": "2020-10-14T03:25:15.644058Z", + "start_time": "2020-10-14T03:25:15.588851Z" } }, "outputs": [ { "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:  (time: 36, x: 275, y: 205)\n",
+       "Coordinates:\n",
+       "  * time     (time) object 1980-09-16 12:00:00 ... 1983-08-17 00:00:00\n",
+       "    xc       (y, x) float64 dask.array<chunksize=(205, 275), meta=np.ndarray>\n",
+       "    yc       (y, x) float64 dask.array<chunksize=(205, 275), meta=np.ndarray>\n",
+       "Dimensions without coordinates: x, y\n",
+       "Data variables:\n",
+       "    Tair     (time, y, x) float64 dask.array<chunksize=(10, 205, 275), meta=np.ndarray>\n",
+       "Attributes:\n",
+       "    title:                     /workspace/jhamman/processed/R1002RBRxaaa01a/l...\n",
+       "    institution:               U.W.\n",
+       "    source:                    RACM R1002RBRxaaa01a\n",
+       "    output_frequency:          daily\n",
+       "    output_mode:               averaged\n",
+       "    convention:                CF-1.4\n",
+       "    references:                Based on the initial model of Liang et al., 19...\n",
+       "    comment:                   Output from the Variable Infiltration Capacity...\n",
+       "    nco_openmp_thread_number:  1\n",
+       "    NCO:                       netCDF Operators version 4.7.9 (Homepage = htt...\n",
+       "    history:                   Fri Aug  7 17:57:38 2020: ncatted -a bounds,,d...
" + ], "text/plain": [ - "True" + "\n", + "Dimensions: (time: 36, x: 275, y: 205)\n", + "Coordinates:\n", + " * time (time) object 1980-09-16 12:00:00 ... 1983-08-17 00:00:00\n", + " xc (y, x) float64 dask.array\n", + " yc (y, x) float64 dask.array\n", + "Dimensions without coordinates: x, y\n", + "Data variables:\n", + " Tair (time, y, x) float64 dask.array\n", + "Attributes:\n", + " title: /workspace/jhamman/processed/R1002RBRxaaa01a/l...\n", + " institution: U.W.\n", + " source: RACM R1002RBRxaaa01a\n", + " output_frequency: daily\n", + " output_mode: averaged\n", + " convention: CF-1.4\n", + " references: Based on the initial model of Liang et al., 19...\n", + " comment: Output from the Variable Infiltration Capacity...\n", + " nco_openmp_thread_number: 1\n", + " NCO: netCDF Operators version 4.7.9 (Homepage = htt...\n", + " history: Fri Aug 7 17:57:38 2020: ncatted -a bounds,,d..." ] }, - "execution_count": 48, + "execution_count": 77, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "@jit(nopython=True)\n", - "def can_compile(x):\n", - " return \"a\" in x\n", - "\n", - "\n", - "can_compile((\"a\", \"b\", \"c\"))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "### Exercise\n", - "Gregory–Leibniz infinite series converges to $\\pi$:\n", - "$$\\pi = \\frac{4}{1} - \\frac{4}{3} + \\frac{4}{5} - \\frac{4}{7} + \\frac{4}{9} - \\frac{4}{11} + \\frac{4}{13} - \\cdots$$\n", - "\n", - "Write a Numba function which calculates the sum of first $n$ terms in this series. Then test its speed agains normal Python function for $ n = 1000000$." - ] - }, - { - "cell_type": "code", - "execution_count": 49, - "metadata": { - "ExecuteTime": { - "end_time": "2020-10-04T07:14:16.556883Z", - "start_time": "2020-10-04T07:14:16.553515Z" - } - }, - "outputs": [], - "source": [ - "# Code Here" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "
Solution\n", - "\n", - "```Python\n", - " @jit\n", - " def gl_pi(n):\n", - " pi = 0\n", - " for i in range(n):\n", - " if i%2 ==0:\n", - " pi += 4/(2*i+1)\n", - " else:\n", - " pi -= 4/(2*i+1)\n", - " return pi \n", - "```\n", - "\n", - "Numba function speed test:\n", - "```Python\n", - " %timeit gl_pi(1000000) \n", - "```\n", - " \n", - "Normal Python function speed test:\n", - "```Python\n", - " %timeit gl_pi.py_func(1000000) \n", - "```\n", - " \n", - "
" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Xarray\n", + "%matplotlib inline\n", + "import numpy as np\n", + "import pandas as pd\n", + "import xarray as xr\n", + "import matplotlib.pyplot as plt\n", "\n", - "Xarray is pandas for N-dimensional data. It also has a [dask backend](http://xarray.pydata.org/en/stable/dask.html)" + "ds = xr.tutorial.open_dataset('rasm').load().chunk(dict(time=10))\n", + "ds" ] }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 79, "metadata": { "ExecuteTime": { - "end_time": "2020-10-13T11:22:29.816836Z", - "start_time": "2020-10-13T11:22:28.707555Z" + "end_time": "2020-10-14T03:26:30.730070Z", + "start_time": "2020-10-14T03:26:30.473977Z" } }, "outputs": [ @@ -2639,61 +10583,26 @@ " fill: currentColor;\n", "}\n", "
<xarray.Dataset>\n",
-       "Dimensions:  (time: 36, x: 275, y: 205)\n",
+       "Dimensions:  (x: 275, y: 205)\n",
        "Coordinates:\n",
-       "  * time     (time) object 1980-09-16 12:00:00 ... 1983-08-17 00:00:00\n",
-       "    xc       (y, x) float64 dask.array<chunksize=(205, 275), meta=np.ndarray>\n",
-       "    yc       (y, x) float64 dask.array<chunksize=(205, 275), meta=np.ndarray>\n",
-       "Dimensions without coordinates: x, y\n",
-       "Data variables:\n",
-       "    Tair     (time, y, x) float64 dask.array<chunksize=(10, 205, 275), meta=np.ndarray>\n",
-       "Attributes:\n",
-       "    title:                     /workspace/jhamman/processed/R1002RBRxaaa01a/l...\n",
-       "    institution:               U.W.\n",
-       "    source:                    RACM R1002RBRxaaa01a\n",
-       "    output_frequency:          daily\n",
-       "    output_mode:               averaged\n",
-       "    convention:                CF-1.4\n",
-       "    references:                Based on the initial model of Liang et al., 19...\n",
-       "    comment:                   Output from the Variable Infiltration Capacity...\n",
-       "    nco_openmp_thread_number:  1\n",
-       "    NCO:                       netCDF Operators version 4.7.9 (Homepage = htt...\n",
-       "    history:                   Fri Aug  7 17:57:38 2020: ncatted -a bounds,,d...
" ], "text/plain": [ - "\n", - "Dimensions: (x: 275, y: 205)\n", + "\n", + "dask.array\n", "Coordinates:\n", - " time object 1981-07-17 00:00:00\n", - " xc (y, x) float64 dask.array\n", - " yc (y, x) float64 dask.array\n", - "Dimensions without coordinates: x, y\n", - "Data variables:\n", - " Tair (y, x) float64 dask.array\n", - "Attributes:\n", - " title: /workspace/jhamman/processed/R1002RBRxaaa01a/l...\n", - " institution: U.W.\n", - " source: RACM R1002RBRxaaa01a\n", - " output_frequency: daily\n", - " output_mode: averaged\n", - " convention: CF-1.4\n", - " references: Based on the initial model of Liang et al., 19...\n", - " comment: Output from the Variable Infiltration Capacity...\n", - " nco_openmp_thread_number: 1\n", - " NCO: netCDF Operators version 4.7.9 (Homepage = htt...\n", - " history: Fri Aug 7 17:57:38 2020: ncatted -a bounds,,d..." + " * time (time) object 1980-12-31 00:00:00 ... 1983-12-31 00:00:00\n", + " xc float64 dask.array\n", + " yc float64 dask.array" ] }, - "execution_count": 2, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" - }, - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" } ], "source": [ - "# You can use isel instead of iloc. You always need to specify the dimension\n", - "ds.isel(time=10)['Tair'].plot.pcolormesh(\n", - " vmin=-30, vmax=30, cmap='Spectral_r',\n", - " add_colorbar=True, extend='both')\n", - "\n", - "ds.isel(time=10)" + "# You can also resample by date\n", + "res = ds.resample(time='A').mean().isel(x=200, y=200)['Tair']\n", + "# The result is a dask array\n", + "res" ] }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 4, "metadata": { "ExecuteTime": { - "end_time": "2020-10-13T11:22:30.241311Z", - "start_time": "2020-10-13T11:22:30.199187Z" + "end_time": "2020-10-13T11:22:30.348149Z", + "start_time": "2020-10-13T11:22:30.246775Z" } }, "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/dask/array/numpy_compat.py:40: RuntimeWarning: invalid value encountered in true_divide\n", + " x = np.divide(x1, x2, out)\n" + ] + }, { "data": { "text/html": [ @@ -3779,130 +11605,136 @@ " fill: currentColor;\n", "}\n", "
<xarray.DataArray 'Tair' (time: 4)>\n",
-       "dask.array<getitem, shape=(4,), dtype=float64, chunksize=(1,), chunktype=numpy.ndarray>\n",
+       "array([ 6.75662201,  8.97479849, 10.49235584,  9.59892096])\n",
        "Coordinates:\n",
        "  * time     (time) object 1980-12-31 00:00:00 ... 1983-12-31 00:00:00\n",
-       "    xc       float64 dask.array<chunksize=(), meta=np.ndarray>\n",
-       "    yc       float64 dask.array<chunksize=(), meta=np.ndarray>
  • " ], "text/plain": [ "\n", - "dask.array\n", + "array([ 6.75662201, 8.97479849, 10.49235584, 9.59892096])\n", "Coordinates:\n", " * time (time) object 1980-12-31 00:00:00 ... 1983-12-31 00:00:00\n", - " xc float64 dask.array\n", - " yc float64 dask.array" + " xc float64 42.47\n", + " yc float64 44.82" ] }, - "execution_count": 3, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "# You can also resample by date\n", - "res = ds.resample(time='A').mean().isel(x=200, y=200)['Tair']\n", - "# The result is a dask array\n", - "res" + "# But you can use .compute\n", + "res.compute()" ] }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 111, "metadata": { "ExecuteTime": { - "end_time": "2020-10-13T11:22:30.348149Z", - "start_time": "2020-10-13T11:22:30.246775Z" + "end_time": "2020-10-15T23:30:03.058359Z", + "start_time": "2020-10-15T23:30:03.052799Z" } }, "outputs": [ { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - "/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/dask/array/numpy_compat.py:40: RuntimeWarning: invalid value encountered in true_divide\n", - " x = np.divide(x1, x2, out)\n" + "\n" ] }, + { + "data": { + "text/plain": [ + "['__class__',\n", + " '__delattr__',\n", + " '__dict__',\n", + " '__dir__',\n", + " '__doc__',\n", + " '__eq__',\n", + " '__format__',\n", + " '__ge__',\n", + " '__getattribute__',\n", + " '__gt__',\n", + " '__hash__',\n", + " '__init__',\n", + " '__init_subclass__',\n", + " '__le__',\n", + " '__lt__',\n", + " '__module__',\n", + " '__ne__',\n", + " '__new__',\n", + " '__reduce__',\n", + " '__reduce_ex__',\n", + " '__repr__',\n", + " '__setattr__',\n", + " '__sizeof__',\n", + " '__str__',\n", + " '__subclasshook__',\n", + " '__weakref__',\n", + " '_obj',\n", + " '_tslib_field_accessor',\n", + " '_tslib_round_accessor',\n", + " 'ceil',\n", + " 'day',\n", + " 'dayofweek',\n", + " 'dayofyear',\n", + " 'days_in_month',\n", + " 
'daysinmonth',\n", + " 'floor',\n", + " 'hour',\n", + " 'is_leap_year',\n", + " 'is_month_end',\n", + " 'is_month_start',\n", + " 'is_quarter_end',\n", + " 'is_quarter_start',\n", + " 'is_year_end',\n", + " 'is_year_start',\n", + " 'microsecond',\n", + " 'minute',\n", + " 'month',\n", + " 'nanosecond',\n", + " 'quarter',\n", + " 'round',\n", + " 'season',\n", + " 'second',\n", + " 'strftime',\n", + " 'time',\n", + " 'week',\n", + " 'weekday',\n", + " 'weekday_name',\n", + " 'weekofyear',\n", + " 'year']" + ] + }, + "execution_count": 111, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# You can see all the datetime methods\n", + "print(ds.time.dt)\n", + "dir(ds.time.dt)" + ] + }, + { + "cell_type": "code", + "execution_count": 112, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-15T23:30:49.426672Z", + "start_time": "2020-10-15T23:30:49.417263Z" + } + }, + "outputs": [ { "data": { "text/html": [ @@ -4256,87 +12088,770 @@ " stroke: currentColor;\n", " fill: currentColor;\n", "}\n", - "
    <xarray.DataArray 'Tair' (time: 4)>\n",
    -       "array([ 6.75662201,  8.97479849, 10.49235584,  9.59892096])\n",
    +       "
    <xarray.DataArray 'season' (time: 36)>\n",
    +       "array(['SON', 'SON', 'SON', 'DJF', 'DJF', 'DJF', 'MAM', 'MAM', 'MAM',\n",
    +       "       'JJA', 'JJA', 'JJA', 'SON', 'SON', 'SON', 'DJF', 'DJF', 'DJF',\n",
    +       "       'MAM', 'MAM', 'MAM', 'JJA', 'JJA', 'JJA', 'SON', 'SON', 'SON',\n",
    +       "       'DJF', 'DJF', 'DJF', 'MAM', 'MAM', 'MAM', 'JJA', 'JJA', 'JJA'],\n",
    +       "      dtype='<U3')\n",
            "Coordinates:\n",
    -       "  * time     (time) object 1980-12-31 00:00:00 ... 1983-12-31 00:00:00\n",
    -       "    xc       float64 42.47\n",
    -       "    yc       float64 44.82
    " + " * time (time) object 1980-09-16 12:00:00 ... 1983-08-17 00:00:00
    " ], "text/plain": [ - "\n", - "array([ 6.75662201, 8.97479849, 10.49235584, 9.59892096])\n", - "Coordinates:\n", - " * time (time) object 1980-12-31 00:00:00 ... 1983-12-31 00:00:00\n", - " xc float64 42.47\n", - " yc float64 44.82" + "\n", + "array(['SON', 'SON', 'SON', 'DJF', 'DJF', 'DJF', 'MAM', 'MAM', 'MAM',\n", + " 'JJA', 'JJA', 'JJA', 'SON', 'SON', 'SON', 'DJF', 'DJF', 'DJF',\n", + " 'MAM', 'MAM', 'MAM', 'JJA', 'JJA', 'JJA', 'SON', 'SON', 'SON',\n", + " 'DJF', 'DJF', 'DJF', 'MAM', 'MAM', 'MAM', 'JJA', 'JJA', 'JJA'],\n", + " dtype='\n", + "

    Exercise

    \n", + "\n", + " 1. Look at the output of `ds.time.dt.season`\n", + " 2. Try grouping by season and getting the mean\n", + " 3. Plot each season (use the plotting code from above)\n", + " \n", + "\n", + "
    \n", + " → Hints\n", + "\n", + " * You can loop over the groups with `for season, ds_season in ds.groupby(ds.time.dt.season):`\n", + " * You need to remove the time dimension, with `.mean('time')`\n", + " * Use `mean['Tair'].plot.pcolormesh()` to plot\n", + "\n", + "
    \n", + "\n", + "
    \n", + "
    \n", + "
    \n", + " \n", + " → Solution\n", + " \n", + "\n", + " ```python\n", + " for season, ds_season in ds.groupby(ds.time.dt.season): \n", + " mean = ds_season.mean('time')\n", + " mean['Tair'].plot.pcolormesh(\n", + " vmin=-30, vmax=30)\n", + " plt.title(season)\n", + " plt.show()\n", + " ```\n", + "\n", + "
    \n", + "\n", + " " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Introduction to Numba" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## What is Numba?\n", + "\n", + "Numba is a **just-in-time**, **type-specializing**, **function compiler** for accelerating **numerically-focused** Python. That's a long list, so let's break down those terms:\n", + "\n", + " * **function compiler**: Numba compiles Python functions, not entire applications, and not parts of functions. Numba does not replace your Python interpreter, but is just another Python module that can turn a function into a (usually) faster function. \n", + " * **type-specializing**: Numba speeds up your function by generating a specialized implementation for the specific data types you are using. Python functions are designed to operate on generic data types, which makes them very flexible, but also very slow. In practice, you only will call a function with a small number of argument types, so Numba will generate a fast implementation for each set of types.\n", + " * **just-in-time**: Numba translates functions when they are first called. This ensures the compiler knows what argument types you will be using. This also allows Numba to be used interactively in a Jupyter notebook just as easily as a traditional application\n", + " * **numerically-focused**: Currently, Numba is focused on numerical data types, like `int`, `float`, and `complex`. There is very limited string processing support, and many string use cases are not going to work well on the GPU. To get best results with Numba, you will likely be using NumPy arrays.\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### First Steps\n", + "\n", + "Let's write our first Numba function and compile it for the **CPU**. The Numba compiler is typically enabled by applying a *decorator* to a Python function. Decorators are functions that transform Python functions. 
Here we will use the CPU compilation decorator:" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:46:54.654222Z", + "start_time": "2020-10-14T03:46:54.652118Z" + } + }, + "source": [ + "\n", + "The length of the hypotenuse of a right triangle with legs x and y is\n", + " \n", + "$r = \\sqrt{x^2 + y^2}.$\n", + "\n", + "However, the squares of very large or small values of x and y may exceed the range of machine precision when calculated on a computer, leading to an inaccurate result caused by arithmetic underflow and/or arithmetic overflow. A more robust form, valid when $|x| \\ge |y|$ (swap x and y otherwise), is:\n", + "\n", + "$\\mathrm{hypot}(x, y) = |x| \\sqrt{1 + \\left(\\tfrac{y}{x}\\right)^2}$\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": 103, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-15T23:28:05.117434Z", + "start_time": "2020-10-15T23:28:05.113335Z" + } + }, + "outputs": [], + "source": [ + "from numba import jit\n", + "import math\n", + "\n", + "\n", + "@jit\n", + "def hypot(x, y):\n", + " # Implementation from https://en.wikipedia.org/wiki/Hypot\n", + " x = abs(x)\n", + " y = abs(y)\n", + " t = min(x, y)\n", + " x = max(x, y)\n", + " t = t / x\n", + " return x * math.sqrt(1 + t * t)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The above code is equivalent to writing:\n", + "``` python\n", + "def hypot(x, y):\n", + " x = abs(x);\n", + " y = abs(y);\n", + " t = min(x, y);\n", + " x = max(x, y);\n", + " t = t / x;\n", + " return x * math.sqrt(1+t*t)\n", + " \n", + "hypot = jit(hypot)\n", + "```\n", + "This means that the Numba compiler is just a function you can call whenever you want!\n", + "\n", + "Let's try out our hypotenuse calculation:" + ] + }, + { + "cell_type": "code", + "execution_count": 93, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:47:40.979991Z", + "start_time": "2020-10-14T03:47:40.975581Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 6 µs, sys: 1 µs, 
total: 7 µs\n", + "Wall time: 10.3 µs\n" + ] + }, + { + "data": { + "text/plain": [ + "5.0" + ] + }, + "execution_count": 93, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "%%time\n", + "hypot(3.0, 4.0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The first time we call `hypot`, the compiler is triggered and compiles a machine code implementation for float inputs. Numba also saves the original Python implementation of the function in the `.py_func` attribute, so we can call the original Python code to make sure we get the same answer:" + ] + }, + { + "cell_type": "code", + "execution_count": 94, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:47:42.474371Z", + "start_time": "2020-10-14T03:47:42.469826Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "CPU times: user 11 µs, sys: 2 µs, total: 13 µs\n", + "Wall time: 16.2 µs\n" + ] + }, + { + "data": { + "text/plain": [ + "5.0" + ] + }, + "execution_count": 94, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "%%time\n", + "hypot.py_func(3.0, 4.0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Benchmarking\n", + "\n", + "An important part of using Numba is measuring the performance of your new code. Let's see if we actually sped anything up. The easiest way to do this in the Jupyter notebook is to use the `%timeit` magic function. Let's first measure the speed of the original Python:" + ] + }, + { + "cell_type": "code", + "execution_count": 95, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:48:10.886616Z", + "start_time": "2020-10-14T03:48:05.339532Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "684 ns ± 7.08 ns per loop (mean ± std. dev. 
of 7 runs, 1000000 loops each)\n" + ] + } + ], + "source": [ + "%timeit hypot.py_func(3.0, 4.0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The `%timeit` magic runs the statement many times to get an accurate estimate of the run time." + ] + }, + { + "cell_type": "code", + "execution_count": 96, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:48:12.520692Z", + "start_time": "2020-10-14T03:48:10.888168Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "201 ns ± 0.613 ns per loop (mean ± std. dev. of 7 runs, 1000000 loops each)\n" + ] + } + ], + "source": [ + "%timeit hypot(3.0, 4.0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Numba did a pretty good job with this function. It's about 3x faster than the pure Python version.\n", + "\n", + "Of course, a `hypot` function is already present in Python's standard `math` module:" + ] + }, + { + "cell_type": "code", + "execution_count": 97, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:49:28.961742Z", + "start_time": "2020-10-14T03:49:17.857136Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "137 ns ± 0.635 ns per loop (mean ± std. dev. of 7 runs, 10000000 loops each)\n" + ] + } + ], + "source": [ + "%timeit math.hypot(3.0, 4.0)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Python's `math.hypot` is even faster than Numba! This is because Numba introduces some overhead to each function call that is larger than the function call overhead of Python itself. 
Extremely fast functions (like the above one) will be hurt by this.\n", + "\n", + "(However, if you call one Numba function from another one, there is very little function overhead, sometimes even zero if the compiler inlines the function into the other one.)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### How does Numba work?\n", + "\n", + "The first time we called our Numba-wrapped `hypot` function, the following process was initiated:\n", + "\n", + "![Numba Flowchart](img/numba_flowchart.png \"The compilation process\")\n", + "\n", + "We can see the result of type inference by using the `.inspect_types()` method, which prints an annotated version of the source code:" + ] + }, + { + "cell_type": "code", + "execution_count": 98, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:50:36.336290Z", + "start_time": "2020-10-14T03:50:36.332574Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "hypot (float64, float64)\n", + "--------------------------------------------------------------------------------\n", + "# File: \n", + "# --- LINE 5 --- \n", + "\n", + "@jit\n", + "\n", + "# --- LINE 6 --- \n", + "\n", + "def hypot(x, y):\n", + "\n", + " # --- LINE 7 --- \n", + "\n", + " # Implementation from https://en.wikipedia.org/wiki/Hypot\n", + "\n", + " # --- LINE 8 --- \n", + " # label 0\n", + " # x = arg(0, name=x) :: float64\n", + " # y = arg(1, name=y) :: float64\n", + " # $2load_global.0 = global(abs: ) :: Function()\n", + " # $6call_function.2 = call $2load_global.0(x, func=$2load_global.0, args=[Var(x, :8)], kws=(), vararg=None) :: (float64,) -> float64\n", + " # del x\n", + " # del $2load_global.0\n", + " # x.1 = $6call_function.2 :: float64\n", + " # del $6call_function.2\n", + "\n", + " x = abs(x)\n", + "\n", + " # --- LINE 9 --- \n", + " # $10load_global.3 = global(abs: ) :: Function()\n", + " # $14call_function.5 = call $10load_global.3(y, func=$10load_global.3, args=[Var(y, 
:8)], kws=(), vararg=None) :: (float64,) -> float64\n", + " # del y\n", + " # del $10load_global.3\n", + " # y.1 = $14call_function.5 :: float64\n", + " # del $14call_function.5\n", + "\n", + " y = abs(y)\n", + "\n", + " # --- LINE 10 --- \n", + " # $18load_global.6 = global(min: ) :: Function()\n", + " # $24call_function.9 = call $18load_global.6(x.1, y.1, func=$18load_global.6, args=[Var(x.1, :8), Var(y.1, :9)], kws=(), vararg=None) :: (float64, float64) -> float64\n", + " # del $18load_global.6\n", + " # t = $24call_function.9 :: float64\n", + " # del $24call_function.9\n", + "\n", + " t = min(x, y)\n", + "\n", + " # --- LINE 11 --- \n", + " # $28load_global.10 = global(max: ) :: Function()\n", + " # $34call_function.13 = call $28load_global.10(x.1, y.1, func=$28load_global.10, args=[Var(x.1, :8), Var(y.1, :9)], kws=(), vararg=None) :: (float64, float64) -> float64\n", + " # del y.1\n", + " # del x.1\n", + " # del $28load_global.10\n", + " # x.2 = $34call_function.13 :: float64\n", + " # del $34call_function.13\n", + "\n", + " x = max(x, y)\n", + "\n", + " # --- LINE 12 --- \n", + " # $42binary_true_divide.16 = t / x.2 :: float64\n", + " # del t\n", + " # t.1 = $42binary_true_divide.16 :: float64\n", + " # del $42binary_true_divide.16\n", + "\n", + " t = t / x\n", + "\n", + " # --- LINE 13 --- \n", + " # $48load_global.18 = global(math: ) :: Module()\n", + " # $50load_method.19 = getattr(value=$48load_global.18, attr=sqrt) :: Function()\n", + " # del $48load_global.18\n", + " # $const52.20 = const(int, 1) :: Literal[int](1)\n", + " # $58binary_multiply.23 = t.1 * t.1 :: float64\n", + " # del t.1\n", + " # $60binary_add.24 = $const52.20 + $58binary_multiply.23 :: float64\n", + " # del $const52.20\n", + " # del $58binary_multiply.23\n", + " # $62call_method.25 = call $50load_method.19($60binary_add.24, func=$50load_method.19, args=[Var($60binary_add.24, :13)], kws=(), vararg=None) :: (float64,) -> float64\n", + " # del $60binary_add.24\n", + " # del 
$50load_method.19\n", + " # $64binary_multiply.26 = x.2 * $62call_method.25 :: float64\n", + " # del x.2\n", + " # del $62call_method.25\n", + " # $66return_value.27 = cast(value=$64binary_multiply.26) :: float64\n", + " # del $64binary_multiply.26\n", + " # return $66return_value.27\n", + "\n", + " return x * math.sqrt(1 + t * t)\n", + "\n", + "\n", + "================================================================================\n" + ] + } + ], + "source": [ + "hypot.inspect_types()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Note that Numba's type names tend to mirror the NumPy type names, so a Python `float` is a `float64` (also called \"double precision\" in other languages). Taking a look at the data types can sometimes be important in GPU code because the performance of `float32` and `float64` computations will be very different on CUDA devices. An accidental upcast can dramatically slow down a function." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### When Things Go Wrong\n", + "\n", + "Numba cannot compile all Python code. Some functions don't have a Numba-translation, and some kinds of Python types can't be efficiently compiled at all (yet). 
For example, Numba does not support `FrozenSet` (as of this tutorial):" + ] + }, + { + "cell_type": "code", + "execution_count": 99, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:51:04.544166Z", + "start_time": "2020-10-14T03:51:04.459625Z" + }, + "scrolled": true + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + ":1: NumbaWarning: \n", + "Compilation is falling back to object mode WITH looplifting enabled because Function \"cannot_compile\" failed type inference due to: non-precise type pyobject\n", + "During: typing of argument at (3)\n", + "\n", + "File \"\", line 3:\n", + "def cannot_compile(x):\n", + " return \"a\" in x\n", + " ^\n", + "\n", + " @jit\n", + "/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/numba/core/object_mode_passes.py:178: NumbaWarning: Function \"cannot_compile\" was compiled in object mode without forceobj=True.\n", + "\n", + "File \"\", line 2:\n", + "@jit\n", + "def cannot_compile(x):\n", + "^\n", + "\n", + " state.func_ir.loc))\n", + "/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/numba/core/object_mode_passes.py:188: NumbaDeprecationWarning: \n", + "Fall-back from the nopython compilation path to the object mode compilation path has been detected, this is deprecated behaviour.\n", + "\n", + "For more information visit https://numba.pydata.org/numba-doc/latest/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit\n", + "\n", + "File \"\", line 2:\n", + "@jit\n", + "def cannot_compile(x):\n", + "^\n", + "\n", + " state.func_ir.loc))\n" + ] + }, + { + "data": { + "text/plain": [ + "True" ] }, - "execution_count": 4, + "execution_count": 99, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "# But you can use .compute\n", - "res.compute()" + "@jit\n", + "def cannot_compile(x):\n", + " return \"a\" in x\n", + "\n", + "\n", + "cannot_compile(frozenset((\"a\", \"b\", \"c\")))" + ] + }, + { + "cell_type": "markdown", + 
"metadata": {}, + "source": [ + "Wait, what happened?? By default, Numba will fall back to a mode, called \"object mode,\" which does not do type-specialization. Object mode exists to enable other Numba functionality, but in many cases, you want Numba to tell you if type inference fails. You can force \"nopython mode\" (the other compilation mode) by passing arguments to the decorator:" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 101, "metadata": { "ExecuteTime": { - "end_time": "2020-10-13T11:31:32.414803Z", - "start_time": "2020-10-13T11:31:31.326331Z" - } + "end_time": "2020-10-14T03:55:40.035890Z", + "start_time": "2020-10-14T03:55:40.026166Z" + }, + "scrolled": true }, - "outputs": [], - "source": [] + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "ERROR:root:Failed in nopython mode pipeline (step: nopython frontend)\n", + "non-precise type pyobject\n", + "During: typing of argument at (3)\n", + "\n", + "File \"\", line 3:\n", + "def cannot_compile(x):\n", + " return \"a\" in x\n", + " ^\n", + "\n", + "This error may have been caused by the following argument(s):\n", + "- argument 0: cannot determine Numba type of \n", + "Traceback (most recent call last):\n", + " File \"\", line 6, in \n", + " cannot_compile(frozenset((\"a\", \"b\", \"c\")))\n", + " File \"/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/numba/core/dispatcher.py\", line 415, in _compile_for_args\n", + " error_rewrite(e, 'typing')\n", + " File \"/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/numba/core/dispatcher.py\", line 358, in error_rewrite\n", + " reraise(type(e), e, None)\n", + " File \"/anaconda/envs/py37_pytorch/lib/python3.7/site-packages/numba/core/utils.py\", line 80, in reraise\n", + " raise value.with_traceback(tb)\n", + "numba.core.errors.TypingError: Failed in nopython mode pipeline (step: nopython frontend)\n", + "non-precise type pyobject\n", + "During: typing of argument at (3)\n", + "\n", + 
"File \"\", line 3:\n", + "def cannot_compile(x):\n", + " return \"a\" in x\n", + " ^\n", + "\n", + "This error may have been caused by the following argument(s):\n", + "- argument 0: cannot determine Numba type of \n", + "\n" + ] + } + ], + "source": [ + "@jit(nopython=True)\n", + "def cannot_compile(x):\n", + " return \"a\" in x\n", + "\n", + "try:\n", + " cannot_compile(frozenset((\"a\", \"b\", \"c\")))\n", + "except Exception as e:\n", + " logging.exception(e)" + ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "
    \n", - "

    Exercise

    \n", - "\n", - " 1. Look at the output of `ds.time.dt.season`\n", - " 2. Try grouping by season and getting the mean\n", - " 3. Plot each season (use the plotting code from above)\n", - " \n", - "\n", - "
    \n", - " → Hints\n", - "\n", - " * You do a for loop over groups `for season, ds_season in ds.groupby(ds.time.dt.season):`\n", - " * You need to remove the time dimension, with `.mean('time')`\n", - " * Use `mean['Tair'].plot.pcolormesh()` to plot\n", + "Now we get an exception when Numba tries to compile the function, with an error that says:\n", + "```\n", + "- argument 0: cannot determine Numba type of <class 'frozenset'>\n", + "```\n", + "which is the underlying problem. Numba doesn't know about `frozenset`. There are classes that we use regularly in our code that are not supported by Numba. A common example of a class that you cannot use in Numba is the pandas `DataFrame`.
    Now the question is: what does Numba support? Some of the types/classes that are supported by Numba are listed below:\n", + "* Numbers (integers, floats, etc)\n", + "* Numpy arrays\n", + "* Strings\n", + "* Lists and tuples (note that a list/tuple of numbers or strings is supported but a list of lists is not)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "So, if we want the last example to be compiled successfully by Numba jit, we need to use a tuple or a list." + ] + }, + { + "cell_type": "code", + "execution_count": 102, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-14T03:56:02.269146Z", + "start_time": "2020-10-14T03:56:01.765963Z" + } + }, + "outputs": [ + { + "data": { + "text/plain": [ + "True" + ] + }, + "execution_count": 102, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "@jit(nopython=True)\n", + "def can_compile(x):\n", + " return \"a\" in x\n", "\n", - "
    \n", "\n", - "
    \n", - "
    \n", - "
    \n", - " \n", - " → Solution\n", - " \n", + "can_compile((\"a\", \"b\", \"c\"))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Exercise\n", + "The Gregory–Leibniz infinite series converges to $\\pi$:\n", + "$$\\pi = \\frac{4}{1} - \\frac{4}{3} + \\frac{4}{5} - \\frac{4}{7} + \\frac{4}{9} - \\frac{4}{11} + \\frac{4}{13} - \\cdots$$\n", "\n", - " ```python\n", - " for season, ds_season in ds.groupby(ds.time.dt.season): \n", - " mean = ds_season.mean('time')\n", - " mean['Tair'].plot.pcolormesh(\n", - " vmin=-30, vmax=30)\n", - " plt.title(season)\n", - " plt.show()\n", - " ```\n", + "Write a Numba function which calculates the sum of the first $n$ terms in this series. Then test its speed against the normal Python function for $n = 1000000$." + ] + }, + { + "cell_type": "code", + "execution_count": 49, + "metadata": { + "ExecuteTime": { + "end_time": "2020-10-04T07:14:16.556883Z", + "start_time": "2020-10-04T07:14:16.553515Z" + } + }, + "outputs": [], + "source": [ + "# Code Here" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "
    Solution\n", "\n", - "
    \n", + "```Python\n", + " @jit\n", + " def gl_pi(n):\n", + " pi = 0\n", + " for i in range(n):\n", + " if i%2 ==0:\n", + " pi += 4/(2*i+1)\n", + " else:\n", + " pi -= 4/(2*i+1)\n", + " return pi \n", + "```\n", "\n", - "
    " + "Numba function speed test:\n", + "```Python\n", + " %timeit gl_pi(1000000) \n", + "```\n", + " \n", + "Normal Python function speed test:\n", + "```Python\n", + " %timeit gl_pi.py_func(1000000) \n", + "```\n", + " \n", + "" ] }, { diff --git a/notebooks/c05_Big_Data/Working_with_Big_Data.py b/notebooks/c05_Big_Data/Working_with_Big_Data.py index ea26a63..748c8ed 100644 --- a/notebooks/c05_Big_Data/Working_with_Big_Data.py +++ b/notebooks/c05_Big_Data/Working_with_Big_Data.py @@ -130,7 +130,7 @@ def memory_usage(): result - +df2 #
    #

    Exercise

    @@ -176,7 +176,33 @@ def memory_usage(): # # # -#
    +# +# + +# + +# With pandas +# pixels = df1.loc[:, ['pixel' in c for c in df1.columns]] +pixels = df1.loc[:, 'pixel1':'pixel783'] +pixels +df1['sum']=pixels.sum(axis=1) +df1['sum'] +# task = df1[['label','sum']].groupby('label').mean() +df1[['label','sum']].groupby('label').mean() + +gg = df1[['label','sum']].groupby('label') +list(gg)[0] +# df1.loc[:, 'pixel1':'pixel783'].csum +# print(result) + +# # With dask +pixels = df2.loc[:, ['pixel' in c for c in df2.columns]] +pixels +# df2['sum']=pixels.sum(axis=1) +# task = df2[['label','sum']].groupby('label').mean() +# with ProgressBar(): +# result=task.compute() +# print(result) +# - # ## When to use Dask DataFrame? # @@ -271,7 +297,7 @@ def memory_usage(): # d = array.linalg.norm(y,axis=1) # with ProgressBar(): # result = d.compute() -# hist(result,bins=100); +# plt.hist(result,bins=100); # ``` # # @@ -347,6 +373,83 @@ def task2(x, y): y = task2(x1,x2) y.compute() +# # Xarray +# +# Xarray is pandas for N-dimensional data. It also has a [dask backend](http://xarray.pydata.org/en/stable/dask.html) + +# + +# %matplotlib inline +import numpy as np +import pandas as pd +import xarray as xr +import matplotlib.pyplot as plt + +ds = xr.tutorial.open_dataset('rasm').load().chunk(dict(time=10)) +ds + +# + +# You can use isel instead of iloc. You always need to specify the dimension +ds.isel(time=10)['Tair'].plot.pcolormesh( + vmin=-30, vmax=30, cmap='Spectral_r', + add_colorbar=True, extend='both') + +ds.isel(time=10) +plt.title('Seasonal Surface Air Temperature') +# - + +# You can also resample by date +res = ds.resample(time='A').mean().isel(x=200, y=200)['Tair'] +# The result is a dask array +res + +# But you can use .compute +res.compute() + +# You can see all the datetime methods +print(ds.time.dt) +dir(ds.time.dt) + +# These are seasons specified by the months inside +# JJA = Jun, Jul, Aug. +ds.time.dt.season + +#
    +#

    Exercise

    +# +# 1. Look at the output of `ds.time.dt.season` +# 2. Try grouping by season and getting the mean +# 3. Plot each season (use the plotting code from above) +# +# +#
    +# → Hints +# +# * You do a for loop over groups `for season, ds_season in ds.groupby(ds.time.dt.season):` +# * You need to remove the time dimension, with `.mean('time')` +# * Use `mean['Tair'].plot.pcolormesh()` to plot +# +#
    +# +#
    +#
    +#
    +# +# → Solution +# +# +# ```python +# for season, ds_season in ds.groupby(ds.time.dt.season): +# mean = ds_season.mean('time') +# mean['Tair'].plot.pcolormesh( +# vmin=-30, vmax=30) +# plt.title(season) +# plt.show() +# ``` +# +#
    +# +#
    + # # Introduction to Numba # ## What is Numba? @@ -363,6 +466,17 @@ def task2(x, y): # # Let's write our first Numba function and compile it for the **CPU**. The Numba compiler is typically enabled by applying a *decorator* to a Python function. Decorators are functions that transform Python functions. Here we will use the CPU compilation decorator: +# +# The length of the hypotenuse of a right triangle with legs x and y is +# +# $r = \sqrt{x^2 + y^2}.$ +# +# However, the squares of very large or small values of x and y may exceed the range of machine precision when calculated on a computer, leading to an inaccurate result caused by arithmetic underflow and/or arithmetic overflow. A numerically safer, mathematically equivalent form (taking x as the larger of the two magnitudes) is +# +# $r = |x| \sqrt{1 + \left(\tfrac{y}{x}\right)^2}.$ +# +# + # + from numba import jit import math @@ -397,10 +511,12 @@ def hypot(x, y): # # Let's try out our hypotenuse calculation: +# %%time hypot(3.0, 4.0) # The first time we call `hypot`, the compiler is triggered and compiles a machine code implementation for float inputs. Numba also saves the original Python implementation of the function in the `.py_func` attribute, so we can call the original Python code to make sure we get the same answer: +# %%time hypot.py_func(3.0, 4.0) # ### Benchmarking @@ -523,76 +639,6 @@ def can_compile(x): # # -# # Xarray -# -# Xarray is pandas for N-dimensional data. It also has a [dask backend](http://xarray.pydata.org/en/stable/dask.html) - -# + -# %matplotlib inline -import numpy as np -import pandas as pd -import xarray as xr -import matplotlib.pyplot as plt - -ds = xr.tutorial.open_dataset('rasm').load().chunk(dict(time=10)) -ds - -# + -# You can use isel instead of iloc. 
You always need to specify the dimension -ds.isel(time=10)['Tair'].plot.pcolormesh( - vmin=-30, vmax=30, cmap='Spectral_r', - add_colorbar=True, extend='both') - -ds.isel(time=10) -# - - -# You can also resample by date -res = ds.resample(time='A').mean().isel(x=200, y=200)['Tair'] -# The result is a dask array -res - -# But you can use .compute -res.compute() - - - -#
    -#

    Exercise

    -# -# 1. Look at the output of `ds.time.dt.season` -# 2. Try grouping by season and getting the mean -# 3. Plot each season (use the plotting code from above) -# -# -#
    -# → Hints -# -# * You do a for loop over groups `for season, ds_season in ds.groupby(ds.time.dt.season):` -# * You need to remove the time dimension, with `.mean('time')` -# * Use `mean['Tair'].plot.pcolormesh()` to plot -# -#
    -# -#
    -#
    -#
    -# -# → Solution -# -# -# ```python -# for season, ds_season in ds.groupby(ds.time.dt.season): -# mean = ds_season.mean('time') -# mean['Tair'].plot.pcolormesh( -# vmin=-30, vmax=30) -# plt.title(season) -# plt.show() -# ``` -# -#
    -# -#
    - # # References # The following sources where used for creation of this notebook: # - https://github.com/NCAR/ncar-python-tutorial