### Create training set for Hvaler

In [68]:
library(tidyr)
library(dplyr)
library(lubridate)
library(xts)

# ---- Configuration ---------------------------------------------------------
# Years retained in the output, and the (year, week) combinations whose
# measurements are blanked out so they can serve as a held-out test period.
KeepingYears <- c(2012, 2013)
TestingYears <- c(2013)
TestingWeeks <- c(16, 28, 40, 52, 53)

# Input file and its column types: one timestamp column followed by
# 21 numeric columns.
HvalerDfFile <- "Hvaler/imputed_complete.csv"
HvalerClasses <- c("POSIXct", rep("numeric", times = 21))

# ---- Load and restrict to the years of interest ----------------------------
df <- read.csv(
  file = HvalerDfFile,
  colClasses = HvalerClasses,
  stringsAsFactors = FALSE
)
df <- filter(df, year(DateTime) %in% KeepingYears)

# ---- Mask the test period --------------------------------------------------
# A row belongs to the test period when both its year and its week number
# (as returned by week()) are in the configured sets.
testing_idx <- year(df$DateTime) %in% TestingYears &
  week(df$DateTime) %in% TestingWeeks

# Every column except the timestamp and T01 is set to NA on test rows;
# DateTime and T01 keep their values.
df[testing_idx, setdiff(colnames(df), c("DateTime", "T01"))] <- NA

# ---- Persist ---------------------------------------------------------------
write.csv(df, file = "Hvaler/training_set.csv", row.names = FALSE)

In [69]:
# Visualize training data: draw a strip plot of a single series, one panel
# per calendar year, into a PDF named "<zone>_trainingdata.pdf".
source("Lib/strip.R")  # expected to define strip(); see the banner it prints
zone <- "subs.1"
pdf(file = paste0(zone, "_trainingdata.pdf"), width = 7, height = 5)
strip(
  x = df[[zone]],
  date = df[["DateTime"]],
  cond = year(df[["DateTime"]]),
  arrange = "wide",
  main = paste("Consumption", zone)
)
dev.off()  # close the PDF device opened above


 Module   :  strip 
 Author   :  Tim Appelhans <tim.appelhans@gmail.com>, Thomas Nauss 
 Version  :  2012-01-06 
 License  :  GNU GPLv3, see http://www.gnu.org/licenses/ 


### Create training set for GEFCom2012

In [70]:
library(tidyr)
library(dplyr)
library(lubridate)
library(xts)

# ---- Configuration ---------------------------------------------------------
# Years retained in the output, and the (year, week) combinations whose
# measurements are blanked out so they can serve as a held-out test period.
KeepingYears <- c(2004, 2005, 2006, 2007)
TestingYears <- c(2007)
TestingWeeks <- c(16, 28, 40, 52, 53)

# Input file and its column types: one timestamp column followed by
# 32 numeric columns.
GEFComDfFile <- "GEFCom2012/complete.csv"
GEFComClasses <- c("POSIXct", rep("numeric", times = 32))

# ---- Load and restrict to the years of interest ----------------------------
df <- read.csv(
  file = GEFComDfFile,
  colClasses = GEFComClasses,
  stringsAsFactors = FALSE
)
df <- filter(df, year(DateTime) %in% KeepingYears)

# ---- Mask the test period --------------------------------------------------
# A row belongs to the test period when both its year and its week number
# (as returned by week()) are in the configured sets.
testing_idx <- year(df$DateTime) %in% TestingYears &
  week(df$DateTime) %in% TestingWeeks

# Every column except the timestamp and T01 is set to NA on test rows.
# NOTE(review): only "T01" is preserved here; if this file carries further
# temperature columns they are blanked as well -- confirm that is intended.
df[testing_idx, setdiff(colnames(df), c("DateTime", "T01"))] <- NA

# ---- Persist ---------------------------------------------------------------
write.csv(df, file = "GEFCom2012/training_set.csv", row.names = FALSE)

In [71]:
# Visualize training data: draw a strip plot of a single series, one panel
# per calendar year, into a PDF named "<zone>_trainingdata.pdf".
source("Lib/strip.R")  # expected to define strip(); see the banner it prints
zone <- "zone.1"
pdf(file = paste0(zone, "_trainingdata.pdf"), width = 7, height = 5)
strip(
  x = df[[zone]],
  date = df[["DateTime"]],
  cond = year(df[["DateTime"]]),
  arrange = "wide",
  main = paste("Consumption", zone)
)
dev.off()  # close the PDF device opened above


 Module   :  strip 
 Author   :  Tim Appelhans <tim.appelhans@gmail.com>, Thomas Nauss 
 Version  :  2012-01-06 
 License  :  GNU GPLv3, see http://www.gnu.org/licenses/ 
