Created
July 19, 2013 12:36
-
-
Save tomasgreif/6038822 to your computer and use it in GitHub Desktop.
Parse rpart model.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#' Create SQL statement from rpart rules
#'
#' Converts the root-to-leaf paths of a fitted rpart tree into a single SQL
#' `CASE` expression. Every leaf becomes one `when ... then 'node_<id>'`
#' branch, where `<id>` is the leaf's node number in `model$frame`.
#'
#' Splits on numeric columns of `df` are emitted as comparisons
#' (`col >= value`); splits on any other column are emitted as
#' `col in ('level', ...)`, with single quotes inside levels doubled so the
#' literal stays valid SQL.
#'
#' The rpart package must be attached, because `path.rpart()` is called
#' unqualified. Factor levels that themselves contain a comma cannot be
#' recovered, since `path.rpart()` joins levels with commas.
#'
#' @param df data frame used for rpart model
#' @param model rpart model
#' @return A character string of length one holding the SQL `CASE` expression.
#' @export
#' @examples
#' parse_tree(df=kyphosis,model=rpart(data=kyphosis,formula=Kyphosis~.))
#' parse_tree(df=mtcars,model=rpart(data=mtcars,formula=am~.))
#' parse_tree(df=iris,model=rpart(data=iris,formula=Species~.))
#' \dontrun{
#' x <- german_data
#' x$gbbin <- NULL
#' model <- rpart(data=x,formula=gb~.)
#' parse_tree(x,model)
#' }
parse_tree <- function(df = NULL, model = NULL) {
  if (!is.data.frame(df)) {
    stop("`df` must be the data frame used to fit `model`.", call. = FALSE)
  }
  if (is.null(model$frame)) {
    stop("`model` must be a fitted rpart model.", call. = FALSE)
  }

  leaf_nodes <- rownames(model$frame)[model$frame$var == "<leaf>"]
  # print.it = FALSE keeps path.rpart() silent, so no output capture is needed.
  leaf_paths <- path.rpart(model, nodes = leaf_nodes, print.it = FALSE)

  # Two-character operators come first so "<=" / ">=" win over "<" / ">" when
  # both could match at the same position (perl = TRUE tries alternatives in
  # the order written).
  operator_pattern <- "<=|>=|<|>|="

  # Turn one path component ("Age< 55", "Species=a,b") into a SQL predicate.
  # Returns NULL for components without an operator, i.e. the "root" marker.
  build_condition <- function(component) {
    hit <- regexpr(operator_pattern, component, perl = TRUE)
    start <- as.integer(hit)
    if (start < 0L) {
      return(NULL)
    }
    width <- attr(hit, "match.length")

    # Split at the FIRST operator only, so operator characters that appear
    # inside a factor level stay part of the value.
    column <- substr(component, 1L, start - 1L)
    operator <- substr(component, start, start + width - 1L)
    value <- substr(component, start + width, nchar(component))

    if (!column %in% names(df)) {
      stop(
        "Column `", column, "` used by `model` was not found in `df`.",
        call. = FALSE
      )
    }

    # `[[` returns the column vector for data frames and tibbles alike;
    # `df[, column]` would return a one-column tibble for tibbles.
    if (is.numeric(df[[column]])) {
      return(paste(column, operator, value))
    }

    levels_in <- strsplit(value, ",", fixed = TRUE)[[1L]]
    levels_in <- gsub("'", "''", levels_in, fixed = TRUE)
    paste0(
      column, " in (", paste0("'", levels_in, "'", collapse = ","), ")"
    )
  }

  when_clauses <- vapply(
    seq_along(leaf_paths),
    function(i) {
      conditions <- unlist(lapply(leaf_paths[[i]], build_condition))
      if (length(conditions) == 0L) {
        # Root-only tree: no predicates at all, so match every row.
        conditions <- "1 = 1"
      }
      paste0(
        "when ", paste(conditions, collapse = " AND "),
        " then 'node_", names(leaf_paths)[i], "'"
      )
    },
    character(1)
  )

  pieces <- c("case ", when_clauses)
  if (length(when_clauses) > 0L) {
    pieces <- c(pieces, " end ")
  }
  paste(pieces, collapse = " ")
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Very good work, thank you!