Skip to content

Commit 28c4990

Browse files
committed
Update HDFS deletion command, and run GBM before DRF.
1 parent e8c97e3 commit 28c4990

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

R/examples/manycols.R

+5 -5
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@ library(h2o)
1010
#wget http://h2o-release.s3.amazonaws.com/h2o/h2o-parsemanycols/8/h2o-2.9.0.8.zip
1111
#unzip h2o-2.9.0.8.zip
1212
#cd h2o-2.9.0.8/hadoop
13-
#hadoop fs -rmr myDir
13+
#hadoop fs -rm -r myDir
1414
#hadoop jar h2odriver_hdp2.1.jar water.hadoop.h2odriver -libjars ../h2o.jar -n 8 -mapperXmx 40g -output myDir -baseport 61111 -data_max_factor_levels 65000 -chunk_bits 24
1515

1616
h2oCluster <- h2o.init(ip="mr-0xd1", port=61111)
@@ -40,10 +40,10 @@ mdl.glm
4040
pred.glm <- h2o.predict(mdl.glm, valid)
4141
h2o.performance(pred.glm[,3], valid[,response], measure="F1")
4242

43-
# Random Forest
44-
mdl.rf <- h2o.randomForest(x=predictors, y=response, data=train, validation=valid, type="BigData", depth=15, importance=T, balance.classes = T, class.sampling.factors = c(1,250))
45-
mdl.rf
46-
4743
# Gradient Boosted Trees
4844
mdl.gbm <- h2o.gbm(x=predictors, y=response, data=train, validation=valid, importance=T, balance.classes = T, class.sampling.factors = c(1,250))
4945
mdl.gbm
46+
47+
# Random Forest
48+
mdl.rf <- h2o.randomForest(x=predictors, y=response, data=train, validation=valid, type="BigData", depth=15, importance=T, balance.classes = T, class.sampling.factors = c(1,250))
49+
mdl.rf

0 commit comments

Comments
 (0)