From 07159c04e558772339b62f56ad88d9341376f832 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Przemys=C5=82aw=20Biecek?= Date: Sat, 22 Dec 2018 22:50:10 +0100 Subject: [PATCH] init for drifter --- .Rbuildignore | 2 ++ .gitignore | 1 + DESCRIPTION | 9 +++++++++ NAMESPACE | 2 ++ README.md | 11 +++++++++-- drifter.Rproj | 21 +++++++++++++++++++++ 6 files changed, 44 insertions(+), 2 deletions(-) create mode 100644 .Rbuildignore create mode 100644 DESCRIPTION create mode 100644 NAMESPACE create mode 100644 drifter.Rproj diff --git a/.Rbuildignore b/.Rbuildignore new file mode 100644 index 0000000..91114bf --- /dev/null +++ b/.Rbuildignore @@ -0,0 +1,2 @@ +^.*\.Rproj$ +^\.Rproj\.user$ diff --git a/.gitignore b/.gitignore index 26fad6f..be0b467 100644 --- a/.gitignore +++ b/.gitignore @@ -34,3 +34,4 @@ vignettes/*.pdf # Shiny token, see https://shiny.rstudio.com/articles/shinyapps.html rsconnect/ +.Rproj.user diff --git a/DESCRIPTION b/DESCRIPTION new file mode 100644 index 0000000..e5b3fa3 --- /dev/null +++ b/DESCRIPTION @@ -0,0 +1,9 @@ +Package: drifter +Title: Concept Drift and Concept Shift Detection for Predictive Models +Version: 0.1 +Authors@R: person("First", "Last", email = "first.last@example.com", role = c("aut", "cre")) +Description: What the package does (one paragraph). +Depends: R (>= 3.5.0) +License: GPL +Encoding: UTF-8 +LazyData: true diff --git a/NAMESPACE b/NAMESPACE new file mode 100644 index 0000000..884a631 --- /dev/null +++ b/NAMESPACE @@ -0,0 +1,2 @@ +# Generated by roxygen2: fake comment so roxygen2 overwrites silently. +exportPattern("^[^\\.]") diff --git a/README.md b/README.md index 80da533..4b2c862 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,9 @@ -# drifter -Concept Drift and Concept Shift Detection for Predictive Models +# drifter: Concept Drift and Concept Shift Detection for Predictive Models + +Machine learning models are often fitted and validated on historical data under the silent assumption that the data are stationary. 
The most popular techniques for validation (k-fold cross-validation, repeated cross-validation, and so on) test models on data with the same distribution as the training data. + +Yet, in many practical applications, deployed models work in a changing environment. After some time, due to changes in the environment, model performance may degrade, as the model may become less reliable. + +Concept drift refers to a change in the data distribution or in the relationships between variables over time. Think about a model of energy consumption for a school: over time, the school may be equipped with a larger number of devices or with more power-efficient devices, which may affect the model performance. + + diff --git a/drifter.Rproj b/drifter.Rproj new file mode 100644 index 0000000..30e02be --- /dev/null +++ b/drifter.Rproj @@ -0,0 +1,21 @@ +Version: 1.0 + +RestoreWorkspace: No +SaveWorkspace: No +AlwaysSaveHistory: Default + +EnableCodeIndexing: Yes +UseSpacesForTab: Yes +NumSpacesForTab: 2 +Encoding: UTF-8 + +RnwWeave: knitr +LaTeX: pdfLaTeX + +AutoAppendNewline: Yes +StripTrailingWhitespace: Yes + +BuildType: Package +PackageUseDevtools: Yes +PackageInstallArgs: --no-multiarch --with-keep.source +PackageRoxygenize: rd,collate,namespace