Skip to content
Snippets Groups Projects
Commit e4a480ae authored by Oliver's avatar Oliver
Browse files

Added csv for maximum average over a single day, for maximum one hour average...

Added csv for maximum average over a single day, for maximum one hour average and for average over the entire year/dataset
parent 26ad6b13
No related branches found
No related tags found
No related merge requests found
sp_name,sample_datetime,time_basis_id,value
Alphington,01-01-16 0:00,1HR_AV,22.79999924
Alphington,01-01-16 1:00,1HR_AV,26.39999962
Alphington,01-01-16 2:00,1HR_AV,22.60000038
sp_name,value
Alphington,14.423692019423688
Brooklyn,20.259909177105143
Dandenong,15.554988189340063
Footscray,15.077387055742498
Geelong South,17.114088090521765
Mooroolbark,13.03298071988639
Richmond,16.088718474207894
Traralgon,13.789331489934671
sp_name,value
Alphington,310.5
Brooklyn,292.8999939
Dandenong,189.8999939
Footscray,180.5
Geelong South,919.0999756
Mooroolbark,304.1000061
Richmond,336.2000122
Traralgon,120.0999985
sp_name,value
Alphington,37.87500011879167
Brooklyn,82.41250022125
Dandenong,40.941667120000005
Footscray,42.65833330041665
Geelong South,68.35000076016667
Mooroolbark,44.6833333975
Richmond,35.79583295166666
Traralgon,49.191666285416666
ovi.py 0 → 100644
import pandas as pandas
air_quality_readings = pandas.read_csv("2016_1HR.csv", dtype="str", low_memory=False)
def time_to_iso8601(old):
#01-01-16 0:00 to 2016-01-01T00:00
parts = old.split(" ")
old_date = parts[0]
new_date = "20" + old_date[6:8] + "-" + old_date[3:5] + "-" + old_date[0:2]
old_time = parts[1]
time = new_date + "T" + old_time.zfill(5)
return time
air_quality_readings["sample_datetime"] = air_quality_readings["sample_datetime"].apply(time_to_iso8601)
air_quality_readings = air_quality_readings.drop("time_basis_id", axis=1)
air_quality_readings = air_quality_readings.sort_values(['sp_name', 'sample_datetime'])
air_quality_readings['sample_datetime'] = pandas.to_datetime(air_quality_readings['sample_datetime'], format = "%Y-%m-%dT%H:%M")
air_quality_readings['value'] = air_quality_readings['value'].astype(float)
air_quality_readings = air_quality_readings.set_index(["sample_datetime"])
max_readings = air_quality_readings.groupby(['sp_name']).max()
max_readings.to_csv(path_or_buf = "2016_MAX_1HR_READING.csv")
max_24HR = air_quality_readings.groupby(["sp_name"]).resample("D").mean().groupby(["sp_name"]).max()
max_24HR.to_csv(path_or_buf = "2016_MAX_24HR_READING.csv")
average = air_quality_readings.groupby(["sp_name"]).mean()
average.to_csv(path_or_buf = "2016_AV_READING.csv")
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or to comment