我在Windows 8上使用R版本3.3.2。我正在尝试使用C50包中的C5.0算法创建决策树。每当我使用成本矩阵时,决策树长度将变为零。在使用类似的代码和数据集时,我看到人们得到了结果。虽然,我并不完全确定数据集的确切相似性。 可能吗?难道我做错了什么?我附上了我的代码。
C5.0_test<-function(credit){
credit$default<-factor(credit$default, levels = c(1, 2), labels = ("non-defaulter, defaulter"))
set.seed(12345)
credit_rand <- credit[order(runif(1000)), ]
credit_train <- credit_rand[1:900, ]
credit_test <- credit_rand[901:1000, ]
credit_model <- C5.0.default(credit_train[-17], credit_train$default)
credit_pred <- predict(credit_model, credit_test)
credit_boost10 <- C5.0.default(credit_train[-17], credit_train$default, trials = 10)
credit_boost_pred10 <- predict(credit_boost10, credit_test)
error_cost <- matrix(c(0, 1, 2, 0), nrow = 2) # create a cost matrix
credit_cost <- C5.0.default(credit_train[-17], credit_train$default,
costs = error_cost) # Apply the cost matrix to the tree
credit_cost_pred <- predict(credit_cost, credit_test)
CrossTable(credit_test$default, credit_cost_pred, prop.chisq = F, prop.c = F, prop.r = F)
}