Kernel: Python 3
Future question for Dr. Soto
Should I concatinate the dataframes on integer indices or Date-Time indices? I dont think it will make a difference.. not sure which one is easier
In [777]:
In [778]:
Timestamp | Temperature | Humidity | CO2 | Noise | Pressure | |
---|---|---|---|---|---|---|
count | 9.014300e+04 | 90143.000000 | 90143.000000 | 90137.000000 | 90132.000000 | 90143.000000 |
mean | 1.469613e+09 | 22.766724 | 51.291637 | 550.204799 | 38.964730 | 1011.348933 |
std | 7.900773e+06 | 1.592268 | 6.929620 | 318.321732 | 7.100703 | 4.217541 |
min | 1.455917e+09 | 17.900000 | 27.000000 | 201.000000 | 35.000000 | 995.000000 |
25% | 1.462765e+09 | 21.700000 | 49.000000 | 354.000000 | 36.000000 | 1008.300000 |
50% | 1.469657e+09 | 22.900000 | 52.000000 | 416.000000 | 36.000000 | 1011.000000 |
75% | 1.476459e+09 | 23.800000 | 55.000000 | 639.000000 | 38.000000 | 1014.100000 |
max | 1.483257e+09 | 28.500000 | 76.000000 | 2777.000000 | 79.000000 | 1027.500000 |
In [779]:
In [780]:
In [781]:
Timestamp | Timezone : America/Los_Angeles | Temperature | Humidity | CO2 | Noise | Pressure | |
---|---|---|---|---|---|---|---|
Numbered_index | |||||||
1 | 1455917199 | 2/19/16 13:26 | 18.8 | 76 | NaN | NaN | 1015.7 |
2 | 1455917255 | 2/19/16 13:27 | 19.2 | 75 | 718.0 | NaN | 1015.7 |
3 | 1455917257 | 2/19/16 13:27 | 19.9 | 73 | NaN | NaN | 1015.7 |
4 | 1455917513 | 2/19/16 13:31 | 20.3 | 73 | 337.0 | 44.0 | 1015.8 |
5 | 1455917814 | 2/19/16 13:36 | 21.2 | 70 | 332.0 | 47.0 | 1015.7 |
In [782]:
In [783]:
Timezone : America/Los_Angeles | CO2 | |
---|---|---|
Numbered_index | ||
1 | 2/19/16 13:26 | NaN |
In [784]:
In [785]:
In [786]:
In [787]:
In [788]:
In [789]:
Time | CO2 | |
---|---|---|
numbered_index | ||
90144 | 1/1/17 0:00 | 482 |
90145 | 1/1/17 0:05 | 491 |
90146 | 1/1/17 0:11 | 480 |
90147 | 1/1/17 0:16 | 486 |
90148 | 1/1/17 0:21 | 490 |
In [790]:
Timezone : America/Los_Angeles | CO2 | |
---|---|---|
Numbered_index | ||
1 | 2/19/16 13:26 | NaN |
2 | 2/19/16 13:27 | 718.0 |
3 | 2/19/16 13:27 | NaN |
4 | 2/19/16 13:31 | 337.0 |
5 | 2/19/16 13:36 | 332.0 |
In [791]:
Time | CO2 | |
---|---|---|
Numbered_index | ||
1 | 2/19/16 13:26 | NaN |
2 | 2/19/16 13:27 | 718.0 |
3 | 2/19/16 13:27 | NaN |
4 | 2/19/16 13:31 | 337.0 |
5 | 2/19/16 13:36 | 332.0 |
In [792]:
Time | CO2 | |
---|---|---|
numbered_index | ||
100987 | 2/12/17 18:27 | 484 |
100988 | 2/12/17 18:32 | 486 |
100989 | 2/12/17 18:37 | 469 |
100990 | 2/12/17 18:42 | 485 |
100991 | 2/12/17 18:47 | 480 |
In [793]:
Time | CO2 | |
---|---|---|
1 | 2/19/16 13:26 | NaN |
2 | 2/19/16 13:27 | 718.0 |
3 | 2/19/16 13:27 | NaN |
4 | 2/19/16 13:31 | 337.0 |
5 | 2/19/16 13:36 | 332.0 |
In [794]:
Time | CO2 | |
---|---|---|
100987 | 2/12/17 18:27 | 484.0 |
100988 | 2/12/17 18:32 | 486.0 |
100989 | 2/12/17 18:37 | 469.0 |
100990 | 2/12/17 18:42 | 485.0 |
100991 | 2/12/17 18:47 | 480.0 |
In [795]:
<matplotlib.axes._subplots.AxesSubplot at 0x7fc30f81eb00>
In [796]:
In [797]:
In [798]:
In [799]:
Time object
CO2 float64
dtype: object
In [800]:
Time | CO2 | |
---|---|---|
1 | 2/19/16 13:26 | NaN |
2 | 2/19/16 13:27 | 718.0 |
3 | 2/19/16 13:27 | NaN |
4 | 2/19/16 13:31 | 337.0 |
5 | 2/19/16 13:36 | 332.0 |
In [801]:
Time | CO2 | |
---|---|---|
1 | False | True |
2 | False | False |
3 | False | True |
4 | False | False |
5 | False | False |
In [0]:
In [0]:
In [802]:
In [803]:
Time | CO2 | |
---|---|---|
1 | 2016-02-19 13:26:00 | NaN |
2 | 2016-02-19 13:27:00 | 718.0 |
3 | 2016-02-19 13:27:00 | NaN |
4 | 2016-02-19 13:31:00 | 337.0 |
5 | 2016-02-19 13:36:00 | 332.0 |
In [804]:
1 Friday
2 Friday
3 Friday
4 Friday
5 Friday
Name: Time, dtype: object
In [805]:
In [806]:
Time | CO2 | |
---|---|---|
411 | 2016-02-20 23:39:00 | 400.0 |
412 | 2016-02-20 23:44:00 | 419.0 |
413 | 2016-02-20 23:49:00 | 407.0 |
414 | 2016-02-20 23:54:00 | 417.0 |
415 | 2016-02-20 23:59:00 | 417.0 |
In [807]:
Timedelta('359 days 05:21:00')
In [808]:
Time | CO2 | Day | |
---|---|---|---|
1 | 2016-02-19 13:26:00 | NaN | Friday |
2 | 2016-02-19 13:27:00 | 718.0 | Friday |
3 | 2016-02-19 13:27:00 | NaN | Friday |
4 | 2016-02-19 13:31:00 | 337.0 | Friday |
5 | 2016-02-19 13:36:00 | 332.0 | Friday |
In [809]:
Saturday 14598
Tuesday 14589
Sunday 14539
Monday 14488
Wednesday 14472
Friday 14438
Thursday 13867
Name: Day, dtype: int64
In [810]:
<matplotlib.axes._subplots.AxesSubplot at 0x7fc30f0ed1d0>
Switching to df2 because it is still note recognized by datetime
In [811]:
Time | CO2 | |
---|---|---|
numbered_index | ||
90144 | 1/1/17 0:00 | 482 |
90145 | 1/1/17 0:05 | 491 |
90146 | 1/1/17 0:11 | 480 |
90147 | 1/1/17 0:16 | 486 |
90148 | 1/1/17 0:21 | 490 |
In [812]:
In [813]:
Time | CO2 | Day | |
---|---|---|---|
1 | 2016-02-19 13:26:00 | NaN | Friday |
2 | 2016-02-19 13:27:00 | 718.0 | Friday |
3 | 2016-02-19 13:27:00 | NaN | Friday |
4 | 2016-02-19 13:31:00 | 337.0 | Friday |
5 | 2016-02-19 13:36:00 | 332.0 | Friday |
In [814]:
In [815]:
Time | CO2 | Day | Time2 | |
---|---|---|---|---|
1 | 2016-02-19 13:26:00 | NaN | Friday | 2016-02-19 13:27:00 |
2 | 2016-02-19 13:27:00 | 718.0 | Friday | 2016-02-19 13:27:00 |
3 | 2016-02-19 13:27:00 | NaN | Friday | 2016-02-19 13:31:00 |
4 | 2016-02-19 13:31:00 | 337.0 | Friday | 2016-02-19 13:36:00 |
5 | 2016-02-19 13:36:00 | 332.0 | Friday | 2016-02-19 13:41:00 |
In [816]:
Time | CO2 | Day | Time2 | TimeDel | |
---|---|---|---|---|---|
1 | 2016-02-19 13:26:00 | NaN | Friday | 2016-02-19 13:27:00 | 00:01:00 |
2 | 2016-02-19 13:27:00 | 718.0 | Friday | 2016-02-19 13:27:00 | 00:00:00 |
3 | 2016-02-19 13:27:00 | NaN | Friday | 2016-02-19 13:31:00 | 00:04:00 |
4 | 2016-02-19 13:31:00 | 337.0 | Friday | 2016-02-19 13:36:00 | 00:05:00 |
5 | 2016-02-19 13:36:00 | 332.0 | Friday | 2016-02-19 13:41:00 | 00:05:00 |
In [817]:
1 60.0
2 0.0
3 240.0
4 300.0
5 300.0
Name: TimeDel, dtype: float64
In [818]:
Time datetime64[ns]
CO2 float64
Day object
Time2 datetime64[ns]
TimeDel timedelta64[ns]
dtype: object
In [819]:
In [820]:
Time datetime64[ns]
CO2 float64
Day object
Time2 datetime64[ns]
TimeDel float64
dtype: object
In [821]:
In [822]:
Time 0
CO2 6
Day 0
Time2 1
TimeDel 1
CO2_over_TimeDiff 7
dtype: int64
In [823]:
Time | CO2 | Day | Time2 | TimeDel | CO2_over_TimeDiff | |
---|---|---|---|---|---|---|
1 | 2016-02-19 13:26:00 | NaN | Friday | 2016-02-19 13:27:00 | 60.0 | NaN |
3 | 2016-02-19 13:27:00 | NaN | Friday | 2016-02-19 13:31:00 | 240.0 | NaN |
2911 | 2016-02-29 17:03:00 | NaN | Monday | 2016-02-29 17:05:00 | 120.0 | NaN |
32931 | 2016-06-14 05:09:00 | NaN | Tuesday | 2016-06-14 05:10:00 | 60.0 | NaN |
48678 | 2016-08-09 05:21:00 | NaN | Tuesday | 2016-08-09 05:22:00 | 60.0 | NaN |
72565 | 2016-10-31 15:40:00 | NaN | Monday | 2016-10-31 15:44:00 | 240.0 | NaN |
In [824]:
(100991, 6)
In [825]:
In [826]:
(100984, 6)
In [827]:
Time | CO2 | Day | Time2 | TimeDel | CO2_over_TimeDiff | |
---|---|---|---|---|---|---|
2 | 2016-02-19 13:27:00 | 718.0 | Friday | 2016-02-19 13:27:00 | 0.0 | inf |
4 | 2016-02-19 13:31:00 | 337.0 | Friday | 2016-02-19 13:36:00 | 300.0 | 1.123333 |
5 | 2016-02-19 13:36:00 | 332.0 | Friday | 2016-02-19 13:41:00 | 300.0 | 1.106667 |
6 | 2016-02-19 13:41:00 | 328.0 | Friday | 2016-02-19 13:46:00 | 300.0 | 1.093333 |
7 | 2016-02-19 13:46:00 | 307.0 | Friday | 2016-02-19 13:51:00 | 300.0 | 1.023333 |
In [828]:
CO2 | TimeDel | CO2_over_TimeDiff | |
---|---|---|---|
count | 100984.000000 | 100984.000000 | 1.009840e+05 |
mean | 547.647548 | 307.336608 | inf |
std | 304.512740 | 1369.027580 | NaN |
min | 201.000000 | -3300.000000 | -3.500000e-01 |
25% | 362.000000 | 300.000000 | 1.200000e+00 |
50% | 438.000000 | 300.000000 | 1.453333e+00 |
75% | 615.000000 | 300.000000 | 2.040000e+00 |
max | 2777.000000 | 424320.000000 | inf |
In [829]:
2 inf
4 1.123333
5 1.106667
6 1.093333
7 1.023333
Name: CO2_over_TimeDiff, dtype: float64
In [0]: