In [17]:
# Load the serialized weather data set from disk.
wetterdaten <- readRDS(file = "datasets/rds/wetterdaten.rds")

# Pick the station to analyse: the sixth element of the loaded object is used
# as the Norderney data throughout the rest of the notebook.
norderney <- wetterdaten[[6L]]

In [19]:
# A date column cannot serve as a numeric predictor, so derive a numeric time
# index instead: the offset of every measurement date from the earliest one.
norderney[["Zeitindex"]] <- with(
  norderney,
  as.numeric(MESS_DATUM - min(MESS_DATUM))
)
head(norderney)

# Drop the date and station-id columns so that cor() can be applied to the
# whole data frame.
norderney[["MESS_DATUM"]] <- NULL
norderney[["STATIONS_ID"]] <- NULL
head(norderney)

Unnamed: 0_level_0,STATIONS_ID,MESS_DATUM,RSK,SDK,TMK,Zeitindex
Unnamed: 0_level_1,<int>,<date>,<dbl>,<dbl>,<dbl>,<dbl>
46346,3631,2014-01-01,0.2,3.6,5.8,0
46347,3631,2014-01-02,0.5,0.5,7.9,1
46348,3631,2014-01-03,2.4,0.0,7.2,2
46349,3631,2014-01-04,1.3,3.0,6.8,3
46350,3631,2014-01-05,0.4,5.0,5.7,4
46351,3631,2014-01-06,5.0,0.4,8.1,5


Unnamed: 0_level_0,RSK,SDK,TMK,Zeitindex
Unnamed: 0_level_1,<dbl>,<dbl>,<dbl>,<dbl>
46346,0.2,3.6,5.8,0
46347,0.5,0.5,7.9,1
46348,2.4,0.0,7.2,2
46349,1.3,3.0,6.8,3
46350,0.4,5.0,5.7,4
46351,5.0,0.4,8.1,5


In [88]:
# A regression analysis always starts with a correlation analysis:
# first the full pairwise correlation matrix, then a significance test for the
# correlation between the time index and TMK.
cor(x = norderney)
cor.test(
  x = norderney$Zeitindex,
  y = norderney$TMK,
  conf.level = 0.95
)

Unnamed: 0,RSK,SDK,TMK,Zeitindex
RSK,1.0,-0.26749939,0.0460052,0.02976479
SDK,-0.26749939,1.0,0.43409277,0.01660079
TMK,0.0460052,0.43409277,1.0,0.04970893
Zeitindex,0.02976479,0.01660079,0.04970893,1.0



	Pearson's product-moment correlation

data:  norderney$Zeitindex and norderney$TMK
t = 3.0003, df = 3634, p-value = 0.002715
alternative hypothesis: true correlation is not equal to 0
95 percent confidence interval:
 0.01723086 0.08208221
sample estimates:
       cor 
0.04970893 


In [85]:
# Heatmap für TMK und Zeitindex 

# Install the required packages if they are missing, then attach them.
# requireNamespace() only checks whether a package is available; unlike
# require() it does not attach the package as a side effect, so attaching is
# done exactly once by the library() calls below (which fail loudly if the
# installation did not succeed).
if (!requireNamespace("RColorBrewer", quietly = TRUE)) {
  install.packages("RColorBrewer")
}
if (!requireNamespace("MASS", quietly = TRUE)) {
  install.packages("MASS")
}
library(RColorBrewer)
library(MASS)

# Render a 2D kernel-density heatmap with a marginal histogram and save it as
# a PNG file.
#
# The wide left panel shows the kernel density estimate (MASS::kde2d on a
# 25 x 25 grid) of column 1 (x axis) against column 2 (y axis). The narrow
# right panel shows horizontal bars with the histogram counts of column 2.
#
# Args:
#   df_to_plot: data frame or matrix whose first two columns are numeric.
#               Column 1 is drawn on the x axis, column 2 on the y axis.
#               Rows with a non-finite value in either column are dropped,
#               because kde2d() rejects missing or infinite values.
#   file_path:  path of the PNG file to write (800 x 300 pixels).
#   x_label:    label of the x axis (defaults to "Zeitindex").
#   y_label:    label of the y axis (defaults to "TMK").
#
# Returns:
#   The value of dev.off(), as before.
#
# NOTE(review): this definition masks stats::heatmap(); the name is kept so
# that existing calls keep working.
heatmap <- function(df_to_plot, file_path,
                    x_label = "Zeitindex", y_label = "TMK") {

    stopifnot(
        length(dim(df_to_plot)) == 2,
        ncol(df_to_plot) >= 2,
        is.character(file_path),
        length(file_path) == 1
    )

    # Keep only rows that are usable by kde2d()
    x_values <- df_to_plot[, 1]
    y_values <- df_to_plot[, 2]
    usable <- is.finite(x_values) & is.finite(y_values)
    if (!any(usable)) {
        stop("df_to_plot contains no rows with finite values in columns 1 and 2",
             call. = FALSE)
    }
    x_values <- x_values[usable]
    y_values <- y_values[usable]

    # Do all computations before opening the device, so that a failure here
    # does not leave an empty PNG file behind
    h2 <- hist(y_values, breaks = 25, plot = FALSE)
    k <- MASS::kde2d(x_values, y_values, n = 25)

    # Colour palette: reversed "Spectral" scale interpolated to 32 colours
    rf <- colorRampPalette(rev(RColorBrewer::brewer.pal(11, "Spectral")))
    r <- rf(32)
    cex <- 1.5

    # Open the PNG device and guarantee that it is closed again even if one
    # of the plotting calls below fails
    png(file_path, width = 800, height = 300)
    device_closed <- FALSE
    on.exit(if (!device_closed) dev.off(), add = TRUE)

    # Density image on the left
    par(mar = c(6, 6, 1, 1), cex.axis = cex)
    layout(matrix(c(1, 2), 1, 2, byrow = TRUE), widths = c(5, 1), heights = c(1, 3))
    image(k, col = r)
    mtext(side = 1, line = 3, x_label, cex = cex)
    mtext(side = 2, line = 3, y_label, cex = cex)

    # Marginal histogram of the y variable on the right
    par(mar = c(5.2, 0, 0.2, 1))
    barplot(h2$counts, axes = FALSE, xlim = c(0, max(h2$counts)), space = 0,
            col = "red", horiz = TRUE)

    device_closed <- TRUE
    dev.off()
}

# Build the data frame for the TMK heatmap.
# heatmap() draws column 1 on the x axis (labelled "Zeitindex") and column 2
# on the y axis (labelled "TMK"), so the time index has to come first.
df_tmk <- data.frame(
  Zeitindex = norderney$Zeitindex,
  TMK = norderney$TMK
)

# Create the TMK heatmap (R is case-sensitive: the object is df_tmk)
heatmap(df_tmk, "plots/linear_regression/heatmap_TMK.png")
