-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsensorutils.py
84 lines (67 loc) · 3.06 KB
/
sensorutils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
# common code for handling the data directory
# filename format:
# DATA_DIR/sensors-yyyy-mm-dd.csv
# file format:
# epoch, date_time, location, temperature, humidity
import datetime
import os.path
import pandas as pd
COLUMNS = ['epoch', 'iso_time', 'location', 'temperature', 'humidity', 'pressure', 'resistance', 'elapsed_time']
def get_cutoff_date(days_ago: int):
return datetime.date.today() - datetime.timedelta(days=days_ago)
def get_cutoff_time(days_ago: int):
cutoff_date = get_cutoff_date(days_ago)
return datetime.datetime.combine(cutoff_date, datetime.time())
def convert_item(item) -> str:
if item is None:
return ''
return str(item)
class DataLocation:
def __init__(self, data_directory, verbose):
self.directory = data_directory
self.verbose = verbose
def get_filename(self, date: datetime.date):
"""
Generate the correct filename for the given date.
"""
date_string = date.isoformat()
filename = os.path.join(self.directory, f'sensors-{date_string}.csv')
return filename
def find_files(self, max_days_ago: int):
"""
Search the directory for data files up to X days ago.
"""
date_range = [datetime.date.today() - datetime.timedelta(days=d) for d in range(0, max_days_ago)]
look_for = [self.get_filename(d) for d in date_range]
return [filename for filename in look_for if os.path.exists(filename)]
def record(self, epoch: int, iso_time: datetime.datetime, location: str,
temperature: float, humidity: float, pressure: float, resistance: float,
elapsed_time: float):
filename = self.get_filename(iso_time.date())
iso_time = datetime.datetime.isoformat(iso_time).split('.')[0]
output_entries = [convert_item(epoch), iso_time, location, convert_item(temperature),
convert_item(humidity), convert_item(pressure),
convert_item(resistance), convert_item(elapsed_time)]
output_line = ','.join(output_entries) + '\n'
with open(filename, 'a', encoding='utf-8') as f:
if self.verbose:
print('writing to', filename)
print(output_line)
f.write(output_line)
return
def get_dataframe(self, max_days_ago: int, location: str) -> pd.DataFrame:
filenames = self.find_files(max_days_ago)
dataframes = []
for fn in filenames:
if self.verbose:
print('Reading', fn)
dataframes.append(pd.read_csv(fn, header=None, names=COLUMNS))
big_dataframe = pd.concat(dataframes)
big_dataframe['timestamp'] = pd.to_datetime(big_dataframe['iso_time'])
big_dataframe['date'] = big_dataframe['timestamp'].dt.date
big_dataframe = big_dataframe.sort_values(by='timestamp', axis=0)
if self.verbose:
print('dataframe', big_dataframe.shape)
print('columns', big_dataframe.columns)
del dataframes
return big_dataframe[big_dataframe['location'] == location]