Skip to content

Commit 1335010

Browse files
committed
update to DataFrames 0.11.7
1 parent aa7a4ba commit 1335010

File tree

8 files changed

+378
-335
lines changed

8 files changed

+378
-335
lines changed

01_constructors.ipynb

Lines changed: 105 additions & 79 deletions
Large diffs are not rendered by default.

02_basicinfo.ipynb

Lines changed: 67 additions & 104 deletions
Original file line numberDiff line numberDiff line change
@@ -5,15 +5,13 @@
55
"metadata": {},
66
"source": [
77
"# Introduction to DataFrames\n",
8-
"**[Bogumił Kamiński](http://bogumilkaminski.pl/about/), May 23, 2018**"
8+
"**[Bogumił Kamiński](http://bogumilkaminski.pl/about/), July 25, 2018**"
99
]
1010
},
1111
{
1212
"cell_type": "code",
1313
"execution_count": 1,
14-
"metadata": {
15-
"collapsed": true
16-
},
14+
"metadata": {},
1715
"outputs": [],
1816
"source": [
1917
"using DataFrames # load package"
@@ -122,75 +120,28 @@
122120
"metadata": {},
123121
"outputs": [
124122
{
125-
"name": "stdout",
126-
"output_type": "stream",
127-
"text": [
128-
"A\n",
129-
"Summary Stats:\n",
130-
"Mean: 1.500000\n",
131-
"Minimum: 1.000000\n",
132-
"1st Quartile: 1.250000\n",
133-
"Median: 1.500000\n",
134-
"3rd Quartile: 1.750000\n",
135-
"Maximum: 2.000000\n",
136-
"Length: 2\n",
137-
"Type: Int64\n",
138-
"\n",
139-
"B\n",
140-
"Summary Stats:\n",
141-
"Mean: 1.000000\n",
142-
"Minimum: 1.000000\n",
143-
"1st Quartile: 1.000000\n",
144-
"Median: 1.000000\n",
145-
"3rd Quartile: 1.000000\n",
146-
"Maximum: 1.000000\n",
147-
"Length: 2\n",
148-
"Type: Union{Float64, Missings.Missing}\n",
149-
"Number Missing: 1\n",
150-
"% Missing: 50.000000\n",
151-
"\n",
152-
"C\n",
153-
"Summary Stats:\n",
154-
"Length: 2\n",
155-
"Type: String\n",
156-
"Number Unique: 2\n",
157-
"\n"
158-
]
123+
"data": {
124+
"text/html": [
125+
"<table class=\"data-frame\"><thead><tr><th></th><th>variable</th><th>mean</th><th>min</th><th>median</th><th>max</th><th>nunique</th><th>nmissing</th><th>eltype</th></tr></thead><tbody><tr><th>1</th><td>A</td><td>1.5</td><td>1</td><td>1.5</td><td>2</td><td></td><td></td><td>Int64</td></tr><tr><th>2</th><td>B</td><td>1.0</td><td>1.0</td><td>1.0</td><td>1.0</td><td></td><td>1</td><td>Float64</td></tr><tr><th>3</th><td>C</td><td></td><td>a</td><td></td><td>b</td><td>2</td><td></td><td>String</td></tr></tbody></table>"
126+
],
127+
"text/plain": [
128+
"3×8 DataFrames.DataFrame\n",
129+
"│ Row │ variable │ mean │ min │ median │ max │ nunique │ nmissing │ eltype │\n",
130+
"├─────┼──────────┼──────┼─────┼────────┼─────┼─────────┼──────────┼─────────┤\n",
131+
"│ 1 │ A │ 1.5 │ 1 │ 1.5 │ 2 │ │ │ Int64 │\n",
132+
"│ 2 │ B │ 1.0 │ 1.0 │ 1.0 │ 1.0 │ │ 1 │ Float64 │\n",
133+
"│ 3 │ C │ │ a │ │ b │ 2 │ │ String │"
134+
]
135+
},
136+
"execution_count": 5,
137+
"metadata": {},
138+
"output_type": "execute_result"
159139
}
160140
],
161141
"source": [
162142
"describe(x)"
163143
]
164144
},
165-
{
166-
"cell_type": "markdown",
167-
"metadata": {},
168-
"source": [
169-
"Use `showcols` to get information about columns stored in a DataFrame."
170-
]
171-
},
172-
{
173-
"cell_type": "code",
174-
"execution_count": 6,
175-
"metadata": {},
176-
"outputs": [
177-
{
178-
"name": "stdout",
179-
"output_type": "stream",
180-
"text": [
181-
"2×3 DataFrames.DataFrame\n",
182-
"│ Col # │ Name │ Eltype │ Missing │ Values │\n",
183-
"├───────┼──────┼──────────────────────────────────┼─────────┼─────────────────┤\n",
184-
"│ 1 │ A │ Int64 │ 0 │ 1 … 2 │\n",
185-
"│ 2 │ B │ Union{Float64, Missings.Missing} │ 1 │ 1.0 … missing │\n",
186-
"│ 3 │ C │ String │ 0 │ a … b │"
187-
]
188-
}
189-
],
190-
"source": [
191-
"showcols(x)"
192-
]
193-
},
194145
{
195146
"cell_type": "markdown",
196147
"metadata": {},
@@ -200,7 +151,7 @@
200151
},
201152
{
202153
"cell_type": "code",
203-
"execution_count": 7,
154+
"execution_count": 6,
204155
"metadata": {},
205156
"outputs": [
206157
{
@@ -212,7 +163,7 @@
212163
" :C"
213164
]
214165
},
215-
"execution_count": 7,
166+
"execution_count": 6,
216167
"metadata": {},
217168
"output_type": "execute_result"
218169
}
@@ -221,6 +172,13 @@
221172
"names(x)"
222173
]
223174
},
175+
{
176+
"cell_type": "markdown",
177+
"metadata": {},
178+
"source": [
179+
"Future tip: In Julia 0.7 `propertynames` is also supported."
180+
]
181+
},
224182
{
225183
"cell_type": "markdown",
226184
"metadata": {},
@@ -230,7 +188,7 @@
230188
},
231189
{
232190
"cell_type": "code",
233-
"execution_count": 8,
191+
"execution_count": 7,
234192
"metadata": {},
235193
"outputs": [
236194
{
@@ -242,7 +200,7 @@
242200
" String "
243201
]
244202
},
245-
"execution_count": 8,
203+
"execution_count": 7,
246204
"metadata": {},
247205
"output_type": "execute_result"
248206
}
@@ -260,10 +218,8 @@
260218
},
261219
{
262220
"cell_type": "code",
263-
"execution_count": 9,
264-
"metadata": {
265-
"collapsed": true
266-
},
221+
"execution_count": 8,
222+
"metadata": {},
267223
"outputs": [],
268224
"source": [
269225
"y = DataFrame(rand(1:10, 1000, 10));"
@@ -278,27 +234,27 @@
278234
},
279235
{
280236
"cell_type": "code",
281-
"execution_count": 10,
237+
"execution_count": 9,
282238
"metadata": {},
283239
"outputs": [
284240
{
285241
"data": {
286242
"text/html": [
287-
"<table class=\"data-frame\"><thead><tr><th></th><th>x1</th><th>x2</th><th>x3</th><th>x4</th><th>x5</th><th>x6</th><th>x7</th><th>x8</th><th>x9</th><th>x10</th></tr></thead><tbody><tr><th>1</th><td>8</td><td>6</td><td>1</td><td>2</td><td>7</td><td>10</td><td>5</td><td>1</td><td>5</td><td>10</td></tr><tr><th>2</th><td>8</td><td>9</td><td>6</td><td>6</td><td>10</td><td>4</td><td>9</td><td>3</td><td>10</td><td>9</td></tr><tr><th>3</th><td>5</td><td>1</td><td>4</td><td>3</td><td>10</td><td>5</td><td>1</td><td>10</td><td>5</td><td>9</td></tr><tr><th>4</th><td>2</td><td>9</td><td>2</td><td>2</td><td>5</td><td>7</td><td>7</td><td>9</td><td>9</td><td>5</td></tr><tr><th>5</th><td>4</td><td>8</td><td>4</td><td>10</td><td>8</td><td>5</td><td>1</td><td>2</td><td>1</td><td>10</td></tr><tr><th>6</th><td>8</td><td>6</td><td>6</td><td>8</td><td>3</td><td>3</td><td>3</td><td>6</td><td>8</td><td>6</td></tr></tbody></table>"
243+
"<table class=\"data-frame\"><thead><tr><th></th><th>x1</th><th>x2</th><th>x3</th><th>x4</th><th>x5</th><th>x6</th><th>x7</th><th>x8</th><th>x9</th><th>x10</th></tr></thead><tbody><tr><th>1</th><td>4</td><td>1</td><td>2</td><td>8</td><td>10</td><td>7</td><td>5</td><td>1</td><td>8</td><td>3</td></tr><tr><th>2</th><td>5</td><td>6</td><td>6</td><td>3</td><td>2</td><td>4</td><td>9</td><td>10</td><td>10</td><td>4</td></tr><tr><th>3</th><td>3</td><td>5</td><td>4</td><td>8</td><td>4</td><td>4</td><td>4</td><td>6</td><td>6</td><td>9</td></tr><tr><th>4</th><td>8</td><td>8</td><td>2</td><td>6</td><td>7</td><td>3</td><td>6</td><td>4</td><td>10</td><td>6</td></tr><tr><th>5</th><td>1</td><td>2</td><td>6</td><td>10</td><td>4</td><td>7</td><td>7</td><td>7</td><td>5</td><td>4</td></tr><tr><th>6</th><td>5</td><td>7</td><td>9</td><td>10</td><td>5</td><td>1</td><td>6</td><td>2</td><td>3</td><td>4</td></tr></tbody></table>"
288244
],
289245
"text/plain": [
290246
"6×10 DataFrames.DataFrame\n",
291247
"│ Row │ x1 │ x2 │ x3 │ x4 │ x5 │ x6 │ x7 │ x8 │ x9 │ x10 │\n",
292248
"├─────┼────┼────┼────┼────┼────┼────┼────┼────┼────┼─────┤\n",
293-
"│ 1 │ 8 │ 6 │ 1 │ 2 │ 7 │ 10 │ 5 │ 1 │ 5 │ 10 │\n",
294-
"│ 2 │ 8 │ 9 │ 6 │ 6 │ 10 │ 4 │ 9 │ 3 │ 10 │ 9 │\n",
295-
"│ 3 │ 5 │ 1 │ 4 │ 3 │ 10 │ 5 │ 1 │ 10 │ 5 │ 9 │\n",
296-
"│ 4 │ 2 │ 9 │ 2 │ 2 │ 5 │ 7 │ 7 │ 9 │ 9 │ 5 │\n",
297-
"│ 5 │ 4 │ 8 │ 4 │ 10 │ 8 │ 5 │ 1 │ 2 │ 1 │ 10 │\n",
298-
"│ 6 │ 8 │ 6 │ 6 │ 8 │ 3 │ 3 │ 3 │ 6 │ 8 │ 6 │"
249+
"│ 1 │ 4 │ 1 │ 2 │ 8 │ 10 │ 7 │ 5 │ 1 │ 8 │ 3 │\n",
250+
"│ 2 │ 5 │ 6 │ 6 │ 3 │ 2 │ 4 │ 9 │ 10 │ 10 │ 4 │\n",
251+
"│ 3 │ 3 │ 5 │ 4 │ 8 │ 4 │ 4 │ 4 │ 6 │ 6 │ 9 │\n",
252+
"│ 4 │ 8 │ 8 │ 2 │ 6 │ 7 │ 3 │ 6 │ 4 │ 10 │ 6 │\n",
253+
"│ 5 │ 1 │ 2 │ 6 │ 10 │ 4 │ 7 │ 7 │ 7 │ 5 │ 4 │\n",
254+
"│ 6 │ 5 │ 7 │ 9 │ 10 │ 5 │ 1 │ 6 │ 2 │ 3 │ 4 │"
299255
]
300256
},
301-
"execution_count": 10,
257+
"execution_count": 9,
302258
"metadata": {},
303259
"output_type": "execute_result"
304260
}
@@ -316,24 +272,24 @@
316272
},
317273
{
318274
"cell_type": "code",
319-
"execution_count": 11,
275+
"execution_count": 10,
320276
"metadata": {},
321277
"outputs": [
322278
{
323279
"data": {
324280
"text/html": [
325-
"<table class=\"data-frame\"><thead><tr><th></th><th>x1</th><th>x2</th><th>x3</th><th>x4</th><th>x5</th><th>x6</th><th>x7</th><th>x8</th><th>x9</th><th>x10</th></tr></thead><tbody><tr><th>1</th><td>1</td><td>10</td><td>5</td><td>7</td><td>8</td><td>6</td><td>1</td><td>2</td><td>3</td><td>6</td></tr><tr><th>2</th><td>1</td><td>1</td><td>2</td><td>7</td><td>9</td><td>7</td><td>3</td><td>3</td><td>3</td><td>3</td></tr><tr><th>3</th><td>4</td><td>6</td><td>1</td><td>2</td><td>1</td><td>1</td><td>4</td><td>7</td><td>9</td><td>4</td></tr></tbody></table>"
281+
"<table class=\"data-frame\"><thead><tr><th></th><th>x1</th><th>x2</th><th>x3</th><th>x4</th><th>x5</th><th>x6</th><th>x7</th><th>x8</th><th>x9</th><th>x10</th></tr></thead><tbody><tr><th>1</th><td>2</td><td>8</td><td>3</td><td>7</td><td>6</td><td>4</td><td>3</td><td>8</td><td>5</td><td>4</td></tr><tr><th>2</th><td>7</td><td>1</td><td>5</td><td>5</td><td>3</td><td>6</td><td>1</td><td>8</td><td>5</td><td>1</td></tr><tr><th>3</th><td>8</td><td>1</td><td>10</td><td>9</td><td>4</td><td>2</td><td>10</td><td>2</td><td>6</td><td>6</td></tr></tbody></table>"
326282
],
327283
"text/plain": [
328284
"3×10 DataFrames.DataFrame\n",
329285
"│ Row │ x1 │ x2 │ x3 │ x4 │ x5 │ x6 │ x7 │ x8 │ x9 │ x10 │\n",
330286
"├─────┼────┼────┼────┼────┼────┼────┼────┼────┼────┼─────┤\n",
331-
"│ 1 │ 1 │ 10 │ 5 │ 7 │ 8 │ 6 │ 1 │ 2 │ 3 │ 6 │\n",
332-
"│ 2 │ 1 │ 1 │ 2 │ 7 │ 9 │ 7 │ 3 │ 3 │ 3 │ 3 │\n",
333-
"│ 3 │ 4 │ 6 │ 1 │ 2 │ 1 │ 1 │ 4 │ 7 │ 9 │ 4 │"
287+
"│ 1 │ 2 │ 8 │ 3 │ 7 │ 6 │ 4 │ 3 │ 8 │ 5 │ 4 │\n",
288+
"│ 2 │ 7 │ 1 │ 5 │ 5 │ 3 │ 6 │ 1 │ 8 │ 5 │ 1 │\n",
289+
"│ 3 │ 8 │ 1 │ 10 │ 9 │ 4 │ 2 │ 10 │ 2 │ 6 │ 6 │"
334290
]
335291
},
336-
"execution_count": 11,
292+
"execution_count": 10,
337293
"metadata": {},
338294
"output_type": "execute_result"
339295
}
@@ -353,7 +309,7 @@
353309
},
354310
{
355311
"cell_type": "code",
356-
"execution_count": 12,
312+
"execution_count": 11,
357313
"metadata": {},
358314
"outputs": [
359315
{
@@ -362,7 +318,7 @@
362318
"([1, 2], [1, 2], [1, 2])"
363319
]
364320
},
365-
"execution_count": 12,
321+
"execution_count": 11,
366322
"metadata": {},
367323
"output_type": "execute_result"
368324
}
@@ -371,6 +327,13 @@
371327
"x[1], x[:A], x[:, 1]"
372328
]
373329
},
330+
{
331+
"cell_type": "markdown",
332+
"metadata": {},
333+
"source": [
334+
"Future tip: In Julia 0.7, accessing a column using the `x.A` syntax (`getproperty`/`setproperty!`) is also supported."
335+
]
336+
},
374337
{
375338
"cell_type": "markdown",
376339
"metadata": {},
@@ -380,7 +343,7 @@
380343
},
381344
{
382345
"cell_type": "code",
383-
"execution_count": 13,
346+
"execution_count": 12,
384347
"metadata": {},
385348
"outputs": [
386349
{
@@ -395,7 +358,7 @@
395358
"│ 1 │ 1 │ 1.0 │ a │"
396359
]
397360
},
398-
"execution_count": 13,
361+
"execution_count": 12,
399362
"metadata": {},
400363
"output_type": "execute_result"
401364
}
@@ -413,7 +376,7 @@
413376
},
414377
{
415378
"cell_type": "code",
416-
"execution_count": 14,
379+
"execution_count": 13,
417380
"metadata": {},
418381
"outputs": [
419382
{
@@ -422,7 +385,7 @@
422385
"1"
423386
]
424387
},
425-
"execution_count": 14,
388+
"execution_count": 13,
426389
"metadata": {},
427390
"output_type": "execute_result"
428391
}
@@ -440,7 +403,7 @@
440403
},
441404
{
442405
"cell_type": "code",
443-
"execution_count": 15,
406+
"execution_count": 14,
444407
"metadata": {},
445408
"outputs": [
446409
{
@@ -456,7 +419,7 @@
456419
"│ 2 │ 1 │ 1.0 │ b │"
457420
]
458421
},
459-
"execution_count": 15,
422+
"execution_count": 14,
460423
"metadata": {},
461424
"output_type": "execute_result"
462425
}
@@ -475,7 +438,7 @@
475438
},
476439
{
477440
"cell_type": "code",
478-
"execution_count": 16,
441+
"execution_count": 15,
479442
"metadata": {},
480443
"outputs": [
481444
{
@@ -491,7 +454,7 @@
491454
"│ 2 │ 2 │ 2.0 │ b │"
492455
]
493456
},
494-
"execution_count": 16,
457+
"execution_count": 15,
495458
"metadata": {},
496459
"output_type": "execute_result"
497460
}
@@ -510,7 +473,7 @@
510473
},
511474
{
512475
"cell_type": "code",
513-
"execution_count": 17,
476+
"execution_count": 16,
514477
"metadata": {},
515478
"outputs": [
516479
{
@@ -526,7 +489,7 @@
526489
"│ 2 │ 7 │ 8.0 │ b │"
527490
]
528491
},
529-
"execution_count": 17,
492+
"execution_count": 16,
530493
"metadata": {},
531494
"output_type": "execute_result"
532495
}
@@ -539,15 +502,15 @@
539502
],
540503
"metadata": {
541504
"kernelspec": {
542-
"display_name": "Julia 0.6.0",
505+
"display_name": "Julia 0.6.2",
543506
"language": "julia",
544507
"name": "julia-0.6"
545508
},
546509
"language_info": {
547510
"file_extension": ".jl",
548511
"mimetype": "application/julia",
549512
"name": "julia",
550-
"version": "0.6.0"
513+
"version": "0.6.3"
551514
}
552515
},
553516
"nbformat": 4,

0 commit comments

Comments
 (0)