{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# `spudtr` epochs dataframe format\n", "\n", "`spudtr` epochs are `pandas.DataFrame` objects.\n", "\n", "There are three key elements:\n", "\n", " 1. `epoch_id`: an index-like integer column, where each value designates a unique epoch\n", " 2. `time`: an index-like column of integer timestamps, the same in each epoch\n", " 3. the rest of the data columns\n", " \n", "There must be at least one epoch.\n", "\n", "There must be at least one timepoint.\n", "\n", "All the epochs must be timestamped exactly the same way.\n", "\n", "> NOTE: timestamps are integers and may be positive, negative, or zero; the units are unspecified, e.g., milliseconds, months, nanoseconds, hours." ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "from matplotlib import pyplot as plt\n", "\n", "from spudtr import get_demo_df, P3_1500_FEATHER\n", "from spudtr import epf\n", "import spudtr.fake_epochs_data as fake_data" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "**Example: simulated categorical and continuous data**\n", "\n", "The `epoch_id` column is \"epoch_id\"; there are four epochs: 0, 1, 2, 3.\n", "\n", "The `time` column is \"days\"; there are 32 days in each epoch: 0, 1, 2, ..., 31.\n", "\n", "The rest of the columns are the data recorded in each epoch at each time stamp." ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | epoch_id | \n", "days | \n", "categorical | \n", "continuous | \n", "channel0 | \n", "channel1 | \n", "channel2 | \n", "channel3 | \n", "
---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "0 | \n", "cat0 | \n", "0.771321 | \n", "-13.170787 | \n", "-30.197057 | \n", "19.609869 | \n", "43.177612 | \n", "
1 | \n", "0 | \n", "1 | \n", "cat0 | \n", "0.020752 | \n", "4.233125 | \n", "-7.726009 | \n", "-65.298259 | \n", "41.464399 | \n", "
2 | \n", "0 | \n", "2 | \n", "cat0 | \n", "0.633648 | \n", "8.191480 | \n", "21.915223 | \n", "18.568468 | \n", "27.639613 | \n", "
3 | \n", "0 | \n", "3 | \n", "cat0 | \n", "0.748804 | \n", "-48.557122 | \n", "-50.952045 | \n", "14.317029 | \n", "-17.186617 | \n", "
4 | \n", "0 | \n", "4 | \n", "cat0 | \n", "0.498507 | \n", "-17.193401 | \n", "50.222266 | \n", "0.782896 | \n", "38.251473 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
123 | \n", "3 | \n", "27 | \n", "cat1 | \n", "0.744603 | \n", "33.167254 | \n", "-7.658414 | \n", "14.630878 | \n", "14.329468 | \n", "
124 | \n", "3 | \n", "28 | \n", "cat1 | \n", "0.469785 | \n", "-60.531560 | \n", "0.774228 | \n", "1.689442 | \n", "0.882024 | \n", "
125 | \n", "3 | \n", "29 | \n", "cat1 | \n", "0.598256 | \n", "16.216221 | \n", "66.028993 | \n", "16.373534 | \n", "4.854384 | \n", "
126 | \n", "3 | \n", "30 | \n", "cat1 | \n", "0.147620 | \n", "-43.268966 | \n", "26.531028 | \n", "-20.493672 | \n", "-12.327708 | \n", "
127 | \n", "3 | \n", "31 | \n", "cat1 | \n", "0.184035 | \n", "-48.265511 | \n", "-41.604676 | \n", "-19.770519 | \n", "27.925069 | \n", "
128 rows × 8 columns
\n", "\n", " | epoch_id | \n", "time_ms | \n", "sub_id | \n", "eeg_artifact | \n", "dblock_path | \n", "log_evcodes | \n", "log_ccodes | \n", "dblock_srate | \n", "ccode | \n", "instrument | \n", "... | \n", "RMOc | \n", "LLTe | \n", "RLTe | \n", "LLOc | \n", "RLOc | \n", "MiOc | \n", "A2 | \n", "HEOG | \n", "rle | \n", "rhz | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0 | \n", "-748 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_0 | \n", "0 | \n", "0 | \n", "250.0 | \n", "1 | \n", "eeg | \n", "... | \n", "-25.093750 | \n", "-0.753906 | \n", "1.480469 | \n", "-13.414062 | \n", "-18.937500 | \n", "-17.734375 | \n", "5.660156 | \n", "98.875000 | \n", "-39.500000 | \n", "38.375000 | \n", "
1 | \n", "0 | \n", "-744 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_0 | \n", "0 | \n", "0 | \n", "250.0 | \n", "1 | \n", "eeg | \n", "... | \n", "-24.593750 | \n", "0.502441 | \n", "-2.466797 | \n", "-17.640625 | \n", "-17.468750 | \n", "-15.304688 | \n", "1.968750 | \n", "104.750000 | \n", "-38.031250 | \n", "41.281250 | \n", "
2 | \n", "0 | \n", "-740 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_0 | \n", "0 | \n", "0 | \n", "250.0 | \n", "1 | \n", "eeg | \n", "... | \n", "-16.484375 | \n", "-1.507812 | \n", "3.947266 | \n", "-15.648438 | \n", "-10.085938 | \n", "-11.171875 | \n", "8.367188 | \n", "102.062500 | \n", "-33.656250 | \n", "43.718750 | \n", "
3 | \n", "0 | \n", "-736 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_0 | \n", "0 | \n", "0 | \n", "250.0 | \n", "1 | \n", "eeg | \n", "... | \n", "-11.804688 | \n", "-15.070312 | \n", "9.867188 | \n", "-14.906250 | \n", "-7.378906 | \n", "-8.742188 | \n", "9.351562 | \n", "100.562500 | \n", "-42.906250 | \n", "37.406250 | \n", "
4 | \n", "0 | \n", "-732 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_0 | \n", "0 | \n", "0 | \n", "250.0 | \n", "1 | \n", "eeg | \n", "... | \n", "-6.394531 | \n", "-4.019531 | \n", "9.125000 | \n", "-10.679688 | \n", "-6.886719 | \n", "-8.015625 | \n", "8.125000 | \n", "98.375000 | \n", "-43.875000 | \n", "37.906250 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
224995 | \n", "600 | \n", "732 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_4 | \n", "0 | \n", "0 | \n", "250.0 | \n", "0 | \n", "cal | \n", "... | \n", "-4.671875 | \n", "-3.517578 | \n", "-4.441406 | \n", "-4.718750 | \n", "-4.671875 | \n", "-3.400391 | \n", "-4.429688 | \n", "-4.406250 | \n", "-3.900391 | \n", "-4.371094 | \n", "
224996 | \n", "600 | \n", "736 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_4 | \n", "0 | \n", "0 | \n", "250.0 | \n", "0 | \n", "cal | \n", "... | \n", "-4.179688 | \n", "-4.019531 | \n", "-4.195312 | \n", "-4.222656 | \n", "-4.425781 | \n", "-3.644531 | \n", "-4.429688 | \n", "-4.160156 | \n", "-3.412109 | \n", "-4.371094 | \n", "
224997 | \n", "600 | \n", "740 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_4 | \n", "0 | \n", "0 | \n", "250.0 | \n", "0 | \n", "cal | \n", "... | \n", "-4.425781 | \n", "-3.767578 | \n", "-4.441406 | \n", "-3.974609 | \n", "-4.425781 | \n", "-3.400391 | \n", "-4.429688 | \n", "-4.160156 | \n", "-3.900391 | \n", "-4.859375 | \n", "
224998 | \n", "600 | \n", "744 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_4 | \n", "0 | \n", "0 | \n", "250.0 | \n", "0 | \n", "cal | \n", "... | \n", "-4.425781 | \n", "-4.269531 | \n", "-4.195312 | \n", "-4.222656 | \n", "-4.425781 | \n", "-3.886719 | \n", "-4.429688 | \n", "-4.406250 | \n", "-3.900391 | \n", "-4.371094 | \n", "
224999 | \n", "600 | \n", "748 | \n", "sub000 | \n", "0 | \n", "sub000/dblock_4 | \n", "0 | \n", "0 | \n", "250.0 | \n", "0 | \n", "cal | \n", "... | \n", "-4.179688 | \n", "-4.019531 | \n", "-3.947266 | \n", "-4.222656 | \n", "-4.179688 | \n", "-3.400391 | \n", "-4.183594 | \n", "-4.406250 | \n", "-3.412109 | \n", "-4.371094 | \n", "
225000 rows × 47 columns
\n", "\n", " | epoch_id | \n", "time_ms | \n", "sub_id | \n", "eeg_artifact | \n", "dblock_path | \n", "log_evcodes | \n", "log_ccodes | \n", "dblock_srate | \n", "ccode | \n", "instrument | \n", "... | \n", "RMOc | \n", "LLTe | \n", "RLTe | \n", "LLOc | \n", "RLOc | \n", "MiOc | \n", "A2 | \n", "HEOG | \n", "rle | \n", "rhz | \n", "
---|
0 rows × 47 columns
\n", "