Skip to content

Commit

Permalink
PUBDEV-1188: add mergecat test as proper runit
Browse files Browse the repository at this point in the history
  • Loading branch information
spennihana committed May 28, 2015
1 parent a36c14f commit 3ef148b
Showing 1 changed file with 31 additions and 0 deletions.
31 changes: 31 additions & 0 deletions h2o-r/tests/testdir_misc/runit_mergecat.R
@@ -0,0 +1,31 @@
# Make the script's own directory the working directory, so that the relative
# path in the source() call below resolves. The script path is read from the
# command-line argument named "f".
# NOTE(review): `$` partially matches list names, so `$"f"` may also pick up a
# longer argument name beginning with "f" (e.g. "file") -- confirm before
# replacing it with an exact-match accessor such as [["f"]].
setwd(normalizePath(dirname(R.utils::commandArgs(asValues=TRUE)$"f")))
# Load the runit helper script from the parent directory.
# Presumably this defines locate(), Log.info(), testEnd() and doTest() used
# below -- confirm against h2o-runit.R.
source('../h2o-runit.R')

# Merge the Chicago crimes frame with the Chicago census frame after forcing
# the census frame's second column to be parsed as an Enum, printing a summary
# of each frame along the way.
#
# conn: accepted for the test-runner calling convention; not used in the body.
#
# The test makes no explicit assertions: it passes if every H2O call completes
# without raising an error.
test.mergecat <- function(conn) {
  census_file <- locate("smalldata/chicago/chicagoCensus.csv")
  crimes_file <- locate("smalldata/chicago/chicagoCrimes10k.csv.zip")

  Log.info("Import Chicago census data...")
  # Import without parsing so the guessed column types can be overridden.
  census_unparsed <- h2o.importFile(census_file, parse = FALSE)
  parse_setup <- h2o.parseSetup(census_unparsed)
  col_types <- parse_setup$column_types
  col_types[2] <- "Enum"  # second column: String -> Enum
  census <- h2o.parseRaw(census_unparsed, col.types = col_types)

  Log.info("Import Chicago crimes data...")
  crimes <- h2o.importFile(crimes_file)

  Log.info("Set column names to be syntactically valid for R")
  names(census) <- make.names(names(census))
  names(crimes) <- make.names(names(crimes))
  print(summary(census))
  print(summary(crimes))

  Log.info("Merge crimes and census data on community area number")
  # Rename the census column to "Community.Area".
  # NOTE(review): presumably this matches a column of the same name in crimes,
  # which h2o.merge then uses as the join key -- confirm.
  census_cols <- names(census)
  census_cols[census_cols == "Community.Area.Number"] <- "Community.Area"
  names(census) <- census_cols
  merged <- h2o.merge(crimes, census)
  print(summary(merged))

  testEnd()
}

# Hand the test function and its description to doTest(), which is defined
# outside this file (presumably in the sourced h2o-runit.R; presumably it
# supplies the `conn` argument and runs the test -- confirm).
doTest("Merging H2O Frames that contain categorical columns", test.mergecat)

0 comments on commit 3ef148b

Please sign in to comment.