advance on tests; almost there...
[talweg.git] / data / scripts / augment_meteo.R
CommitLineData
3d69ff21
BA
1meteo_df = read.csv("meteo.csv")
2
da7f46b8
BA
3#inspiration
4#http://stackoverflow.com/questions/8214303/conditional-replacement-of-values-in-a-data-frame
5
3d69ff21
BA
6meteo_df$Season = 0
7meteo_df$Week = 0
8meteo_df$Pollution = -1
9
da7f46b8
BA
10#Need to load and aggregate PM10 by days: use getData() from package
11data = getData(..., predict_at=0) #TODO:
3d69ff21 12
da7f46b8 13for (i in 1:nrow(meteo_df))
3d69ff21 14{
da7f46b8 15 pm10_level = data$getLevel(i)
3d69ff21
BA
16 #Fill Pollution column: -1 if no info, 0 to 2 for pollution level
17 if (!is.nan(pm10_level))
18 {
19 if (pm10_level < 30)
20 meteo_df$Pollution[i] = 0
21 else if (pm10_level <= 50)
22 meteo_df$Pollution[i] = 1
23 else #pm10 > 50
24 meteo_df$Pollution[i] = 2
25 }
26
27 #Also fill season + days of week variables
28 meteo_df$Season[i] = ifelse(
29 strsplit(as.character(meteo_df$Date[i]),'/')[[1]][1] %in% c("4","5","6","7","8"),
30 1, 0)
31 current_datetime = strptime(as.character(meteo_df$Date[i]), "%m/%d/%Y", tz="GMT")
32 meteo_df$Week[i] = ifelse(current_datetime$wday %in% c(6,0), 0, 1)
33}
34
3d69ff21
BA
35#Finally write new data
36write.csv(meteo_df, file="meteo_extra.csv", row.names=FALSE)