Skip to content

Commit 30f6e15

Browse files
committed
Created using Colaboratory
1 parent 0e53b9c commit 30f6e15

File tree

1 file changed

+38
-27
lines changed

1 file changed

+38
-27
lines changed

day_15/01_intro_dask.ipynb

Lines changed: 38 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -5,14 +5,25 @@
55
"colab": {
66
"name": "01_intro_dask.ipynb",
77
"provenance": [],
8-
"authorship_tag": "ABX9TyOkip/jPKANIdmhdkT7IEkI"
8+
"authorship_tag": "ABX9TyOkip/jPKANIdmhdkT7IEkI",
9+
"include_colab_link": true
910
},
1011
"kernelspec": {
1112
"name": "python3",
1213
"display_name": "Python 3"
1314
}
1415
},
1516
"cells": [
17+
{
18+
"cell_type": "markdown",
19+
"metadata": {
20+
"id": "view-in-github",
21+
"colab_type": "text"
22+
},
23+
"source": [
24+
"<a href=\"https://colab.research.google.com/github/gumdropsteve/intro_to_python/blob/main/day_15/01_intro_dask.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
25+
]
26+
},
1627
{
1728
"cell_type": "markdown",
1829
"metadata": {
@@ -46,7 +57,7 @@
4657
"\r\n",
4758
"df"
4859
],
49-
"execution_count": 1,
60+
"execution_count": null,
5061
"outputs": [
5162
{
5263
"output_type": "execute_result",
@@ -110,7 +121,7 @@
110121
"source": [
111122
"df.to_csv('small.csv', index=False)"
112123
],
113-
"execution_count": 2,
124+
"execution_count": null,
114125
"outputs": []
115126
},
116127
{
@@ -125,7 +136,7 @@
125136
"source": [
126137
"!python -m pip install \"dask[dataframe]\""
127138
],
128-
"execution_count": 4,
139+
"execution_count": null,
129140
"outputs": [
130141
{
131142
"output_type": "stream",
@@ -166,7 +177,7 @@
166177
"\r\n",
167178
"dd.read_csv('small.csv')"
168179
],
169-
"execution_count": 5,
180+
"execution_count": null,
170181
"outputs": [
171182
{
172183
"output_type": "execute_result",
@@ -254,7 +265,7 @@
254265
"source": [
255266
"dd.read_csv('small.csv').compute()"
256267
],
257-
"execution_count": 6,
268+
"execution_count": null,
258269
"outputs": [
259270
{
260271
"output_type": "execute_result",
@@ -322,7 +333,7 @@
322333
"source": [
323334
"type(dd.read_csv('small.csv').compute())"
324335
],
325-
"execution_count": 7,
336+
"execution_count": null,
326337
"outputs": [
327338
{
328339
"output_type": "execute_result",
@@ -353,7 +364,7 @@
353364
"\r\n",
354365
"df.describe()"
355366
],
356-
"execution_count": 12,
367+
"execution_count": null,
357368
"outputs": [
358369
{
359370
"output_type": "execute_result",
@@ -432,7 +443,7 @@
432443
"source": [
433444
"df.describe().compute()"
434445
],
435-
"execution_count": 13,
446+
"execution_count": null,
436447
"outputs": [
437448
{
438449
"output_type": "execute_result",
@@ -551,7 +562,7 @@
551562
"graph = df.__dask_graph__()\r\n",
552563
"graph.layers"
553564
],
554-
"execution_count": 18,
565+
"execution_count": null,
555566
"outputs": [
556567
{
557568
"output_type": "execute_result",
@@ -614,7 +625,7 @@
614625
"# dataframe as is now\r\n",
615626
"df"
616627
],
617-
"execution_count": 19,
628+
"execution_count": null,
618629
"outputs": [
619630
{
620631
"output_type": "execute_result",
@@ -694,7 +705,7 @@
694705
"# just reading\r\n",
695706
"dd.read_csv('small.csv')"
696707
],
697-
"execution_count": 20,
708+
"execution_count": null,
698709
"outputs": [
699710
{
700711
"output_type": "execute_result",
@@ -782,7 +793,7 @@
782793
"source": [
783794
"df.compute()"
784795
],
785-
"execution_count": 21,
796+
"execution_count": null,
786797
"outputs": [
787798
{
788799
"output_type": "execute_result",
@@ -862,7 +873,7 @@
862873
"\r\n",
863874
"!wget \"https://github.com/gumdropsteve/datasets/raw/master/airlines.parquet\""
864875
],
865-
"execution_count": 27,
876+
"execution_count": null,
866877
"outputs": [
867878
{
868879
"output_type": "stream",
@@ -902,7 +913,7 @@
902913
"%%time\r\n",
903914
"pd.read_parquet('airlines.parquet')"
904915
],
905-
"execution_count": 28,
916+
"execution_count": null,
906917
"outputs": [
907918
{
908919
"output_type": "stream",
@@ -1181,7 +1192,7 @@
11811192
"%%time\r\n",
11821193
"dd.read_parquet('airlines.parquet')"
11831194
],
1184-
"execution_count": 29,
1195+
"execution_count": null,
11851196
"outputs": [
11861197
{
11871198
"output_type": "stream",
@@ -1317,7 +1328,7 @@
13171328
"%%time\r\n",
13181329
"dd.read_parquet('airlines.parquet').compute()"
13191330
],
1320-
"execution_count": 33,
1331+
"execution_count": null,
13211332
"outputs": [
13221333
{
13231334
"output_type": "stream",
@@ -1599,7 +1610,7 @@
15991610
"\r\n",
16001611
"df.compute()"
16011612
],
1602-
"execution_count": 45,
1613+
"execution_count": null,
16031614
"outputs": [
16041615
{
16051616
"output_type": "stream",
@@ -1628,7 +1639,7 @@
16281639
"\r\n",
16291640
"df"
16301641
],
1631-
"execution_count": 46,
1642+
"execution_count": null,
16321643
"outputs": [
16331644
{
16341645
"output_type": "stream",
@@ -1681,7 +1692,7 @@
16811692
"total = sum(output)\r\n",
16821693
"total"
16831694
],
1684-
"execution_count": 7,
1695+
"execution_count": null,
16851696
"outputs": [
16861697
{
16871698
"output_type": "execute_result",
@@ -1721,7 +1732,7 @@
17211732
"\r\n",
17221733
"total.visualize()"
17231734
],
1724-
"execution_count": 10,
1735+
"execution_count": null,
17251736
"outputs": [
17261737
{
17271738
"output_type": "execute_result",
@@ -1750,7 +1761,7 @@
17501761
"source": [
17511762
"total.compute()"
17521763
],
1753-
"execution_count": 11,
1764+
"execution_count": null,
17541765
"outputs": [
17551766
{
17561767
"output_type": "execute_result",
@@ -1789,7 +1800,7 @@
17891800
"\r\n",
17901801
"compute(*[total, total])"
17911802
],
1792-
"execution_count": 12,
1803+
"execution_count": null,
17931804
"outputs": [
17941805
{
17951806
"output_type": "execute_result",
@@ -1826,7 +1837,7 @@
18261837
"\r\n",
18271838
"df = dd.read_csv('iris.csv')"
18281839
],
1829-
"execution_count": 17,
1840+
"execution_count": null,
18301841
"outputs": []
18311842
},
18321843
{
@@ -1841,7 +1852,7 @@
18411852
"source": [
18421853
"compute([df])"
18431854
],
1844-
"execution_count": 18,
1855+
"execution_count": null,
18451856
"outputs": [
18461857
{
18471858
"output_type": "execute_result",
@@ -1882,7 +1893,7 @@
18821893
"source": [
18831894
"compute(*[total, total, df])"
18841895
],
1885-
"execution_count": 19,
1896+
"execution_count": null,
18861897
"outputs": [
18871898
{
18881899
"output_type": "execute_result",
@@ -1925,7 +1936,7 @@
19251936
"source": [
19261937
"compute(*[total, df, total])"
19271938
],
1928-
"execution_count": 20,
1939+
"execution_count": null,
19291940
"outputs": [
19301941
{
19311942
"output_type": "execute_result",

0 commit comments

Comments
 (0)