{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Lesson 17: Tidy data and split-apply-combine\n", "\n", "[Data set download](https://s3.amazonaws.com/bebi103.caltech.edu/data/gfmt_sleep.csv)\n", "\n", "
participant number | gender | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess | insomnia |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
i64 | str | i64 | i64 | i64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | i64 | i64 | i64 | bool |
8 | "f" | 39 | 65 | 80 | 72.5 | 91.0 | 90.0 | 93.0 | 83.5 | 93.0 | 90.0 | 9 | 13 | 2 | true |
16 | "m" | 42 | 90 | 90 | 90.0 | 75.5 | 55.5 | 70.5 | 50.0 | 75.0 | 50.0 | 4 | 11 | 7 | true |
18 | "f" | 31 | 90 | 95 | 92.5 | 89.5 | 90.0 | 86.0 | 81.0 | 89.0 | 88.0 | 10 | 9 | 3 | true |
22 | "f" | 35 | 100 | 75 | 87.5 | 89.5 | null | 71.0 | 80.0 | 88.0 | 80.0 | 13 | 8 | 20 | true |
27 | "f" | 74 | 60 | 65 | 62.5 | 68.5 | 49.0 | 61.0 | 49.0 | 65.0 | 49.0 | 13 | 9 | 12 | true |
insomnia | participant number | gender | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
bool | f64 | str | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 |
false | 54.0 | null | 36.0 | 90.0 | 80.0 | 85.0 | 74.5 | 55.5 | 71.5 | 59.0 | 75.0 | 59.25 | 26.0 | 4.0 | 6.0 |
true | 46.0 | null | 39.0 | 90.0 | 75.0 | 75.0 | 76.5 | 72.0 | 71.0 | 68.5 | 77.0 | 65.0 | 14.0 | 9.0 | 7.0 |
insomnia | participant number | gender | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
bool | f64 | str | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 |
true | 46.0 | null | 39.0 | 90.0 | 75.0 | 75.0 | 76.5 | 72.0 | 71.0 | 68.5 | 77.0 | 65.0 | 14.0 | 9.0 | 7.0 |
false | 54.0 | null | 36.0 | 90.0 | 80.0 | 85.0 | 74.5 | 55.5 | 71.5 | 59.0 | 75.0 | 59.25 | 26.0 | 4.0 | 6.0 |
insomnia | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
bool | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 |
true | 39.0 | 90.0 | 75.0 | 75.0 | 76.5 | 72.0 | 71.0 | 68.5 | 77.0 | 65.0 | 14.0 | 9.0 | 7.0 |
false | 36.0 | 90.0 | 80.0 | 85.0 | 74.5 | 55.5 | 71.5 | 59.0 | 75.0 | 59.25 | 26.0 | 4.0 | 6.0 |
insomnia | percent correct | confidence when correct |
---|---|---|
bool | f64 | f64 |
false | 85.0 | 75.0 |
true | 75.0 | 77.0 |
gender | insomnia | participant number | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
str | bool | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 |
"f" | false | 58.0 | 36.0 | 85.0 | 80.0 | 85.0 | 74.0 | 55.0 | 70.5 | 60.0 | 74.0 | 58.75 | 26.0 | 4.0 | 7.0 |
"m" | true | 55.5 | 37.0 | 95.0 | 82.5 | 83.75 | 83.75 | 55.5 | 75.75 | 73.25 | 81.25 | 62.5 | 14.0 | 9.0 | 8.0 |
"f" | true | 46.0 | 39.0 | 80.0 | 75.0 | 72.5 | 76.5 | 73.75 | 71.0 | 68.5 | 77.0 | 70.5 | 14.0 | 9.0 | 7.0 |
"m" | false | 41.0 | 38.5 | 90.0 | 80.0 | 82.5 | 76.0 | 57.75 | 74.25 | 54.75 | 76.25 | 59.25 | 29.0 | 3.0 | 6.0 |
insomnia | percent correct |
---|---|
bool | list[u32] |
true | [11, 21, … 10] |
false | [13, 35, … 7] |
insomnia | percent correct |
---|---|
bool | u32 |
true | 11 |
true | 21 |
true | 23 |
true | 19 |
true | 3 |
… | … |
false | 29 |
false | 57 |
false | 20 |
false | 12 |
false | 7 |
participant number | gender | age | correct hit percentage | correct reject percentage | percent correct | confidence when correct hit | confidence incorrect hit | confidence correct reject | confidence incorrect reject | confidence when correct | confidence when incorrect | sci | psqi | ess | insomnia | percent correct ranked within insomnia groups |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
i64 | str | i64 | i64 | i64 | f64 | f64 | f64 | f64 | f64 | f64 | f64 | i64 | i64 | i64 | bool | u32 |
8 | "f" | 39 | 65 | 80 | 72.5 | 91.0 | 90.0 | 93.0 | 83.5 | 93.0 | 90.0 | 9 | 13 | 2 | true | 11 |
16 | "m" | 42 | 90 | 90 | 90.0 | 75.5 | 55.5 | 70.5 | 50.0 | 75.0 | 50.0 | 4 | 11 | 7 | true | 21 |
18 | "f" | 31 | 90 | 95 | 92.5 | 89.5 | 90.0 | 86.0 | 81.0 | 89.0 | 88.0 | 10 | 9 | 3 | true | 23 |
22 | "f" | 35 | 100 | 75 | 87.5 | 89.5 | null | 71.0 | 80.0 | 88.0 | 80.0 | 13 | 8 | 20 | true | 19 |
27 | "f" | 74 | 60 | 65 | 62.5 | 68.5 | 49.0 | 61.0 | 49.0 | 65.0 | 49.0 | 13 | 9 | 12 | true | 3 |
… | … | … | … | … | … | … | … | … | … | … | … | … | … | … | … | … |
97 | "f" | 23 | 70 | 85 | 77.5 | 77.0 | 66.5 | 77.0 | 77.5 | 77.0 | 74.0 | 20 | 8 | 10 | false | 29 |
98 | "f" | 70 | 90 | 85 | 87.5 | 65.5 | 85.5 | 87.0 | 80.0 | 74.0 | 80.0 | 19 | 8 | 7 | false | 57 |
99 | "f" | 24 | 70 | 80 | 75.0 | 61.5 | 81.0 | 70.0 | 61.0 | 65.0 | 81.0 | 31 | 2 | 15 | false | 20 |
102 | "f" | 40 | 75 | 65 | 70.0 | 53.0 | 37.0 | 84.0 | 52.0 | 81.0 | 51.0 | 22 | 4 | 7 | false | 12 |
103 | "f" | 33 | 85 | 40 | 62.5 | 80.0 | 27.0 | 31.0 | 82.5 | 81.0 | 73.0 | 24 | 5 | 7 | false | 7 |
insomnia | median percent correct |
---|---|
bool | f64 |
false | 85.0 |
true | 75.0 |
insomnia | median percent correct |
---|---|
bool | f64 |
true | 75.0 |
false | 85.0 |
insomnia | coeff of var percent correct |
---|---|
bool | f64 |
true | 0.171856 |
false | 0.138785 |
insomnia | percent correct |
---|---|
bool | f64 |
true | 0.171856 |
false | 0.138785 |
struct[16] |
{8,"f",39,65,80,72.5,91.0,90.0,93.0,83.5,93.0,90.0,9,13,2,true} |
{16,"m",42,90,90,90.0,75.5,55.5,70.5,50.0,75.0,50.0,4,11,7,true} |
{18,"f",31,90,95,92.5,89.5,90.0,86.0,81.0,89.0,88.0,10,9,3,true} |
{22,"f",35,100,75,87.5,89.5,null,71.0,80.0,88.0,80.0,13,8,20,true} |
{27,"f",74,60,65,62.5,68.5,49.0,61.0,49.0,65.0,49.0,13,9,12,true} |
… |
{97,"f",23,70,85,77.5,77.0,66.5,77.0,77.5,77.0,74.0,20,8,10,false} |
{98,"f",70,90,85,87.5,65.5,85.5,87.0,80.0,74.0,80.0,19,8,7,false} |
{99,"f",24,70,80,75.0,61.5,81.0,70.0,61.0,65.0,81.0,31,2,15,false} |
{102,"f",40,75,65,70.0,53.0,37.0,84.0,52.0,81.0,51.0,22,4,7,false} |
{103,"f",33,85,40,62.5,80.0,27.0,31.0,82.5,81.0,73.0,24,5,7,false} |
percent correct |
---|
f64 |
72.5 |
90.0 |
92.5 |
87.5 |
62.5 |
… |
77.5 |
87.5 |
75.0 |
70.0 |
62.5 |
insomnia | bivariate correlation |
---|---|
bool | f64 |
true | 0.590435 |
false | 0.552045 |
insomnia | confidence when correct |
---|---|
bool | f64 |
true | 0.590435 |
false | 0.552045 |