SparkR每个键输出多个文件

时间:2016-10-31 23:18:45

标签: apache-spark sparkr

我一直在用SparkR开发一个项目。我有一个flatMap,它对每个键返回一个数据帧。当我把flatMap的结果保存为文本文件时,只会得到一个文本文件。我希望结果中flatMap的每个键各自对应一个输出文件。我该如何实现?

对分组后得到的每个键进行调整计算

# Adjust the values of every key produced by the grouping step, then write the
# flattened result out as text under "yieldTesting".
#
# Each element handed to the callback is a pair: current_key[[1]] is the key
# and current_key[[2]] is the list of values grouped under that key.
# NOTE(review): format_data_type, clean_data, seperate_combined_fields,
# adjust_values, dfsGroupKey and data_year are defined outside this snippet.
dfsMapKey <- SparkR:::flatMap(dfsGroupKey, function(current_key) {
  tryCatch({
    # Bind the grouped values into a single data frame (transposed so that,
    # presumably, each grouped record becomes one row) and name the columns
    # after the fields of the first record.
    data <- as.data.frame(t(sapply(current_key[[2]], rbind)))
    names(data) <- names(current_key[[2]][[1]])
    data <- format_data_type(data)

    # 1 x 3 list-matrix describing the field whose yield has to be adjusted.
    current_parameter <- matrix(
      list(as.character(unique(data$x)), unique(as.character(data$y)), data_year),
      nrow = 1,      # number of rows
      ncol = 3,      # number of columns
      byrow = TRUE   # fill matrix by rows
    )
    dimnames(current_parameter) <- list(
      list("current_field"),          # row names
      list("x", "y", "data_year")     # column names
    )

    # `<<-` is kept deliberately: the helpers called below presumably read
    # `fields`, `approach`, `useSpan` and `nbs` as globals -- TODO confirm and
    # pass them as arguments instead.
    fields <<- as.data.frame(current_parameter["current_field", ])
    print(fields)

    data <- clean_data(data)
    data$field <- as.character(data$field)
    data <- seperate_combined_fields(data)
    data <- data[, !(names(data) %in% c("gps_year", "gps_month", "gps_day", "crop"))]

    approach <<- "gam"   # enter "gam" or "loess"
    useSpan <<- 0.015
    nbs <<- 500          # number of basic splines

    data <- adjust_values(data)
    data <- data[, !(names(data) %in% c("x"))]

    # Blank out missing values, both real NA and the literal string "NA".
    data[is.na(data)] <- ''
    data[data == "NA"] <- ''

    data <- as.data.frame(t(sapply(data, rbind)))
    return(data)
  }, error = function(e) {
    print(e)
    # print() returns its argument, so ending the handler with it would hand
    # the condition object back to flatMap, which would flatten its fields
    # into the saved output. Return an empty list so a failed key
    # contributes no records.
    list()
  })
})
SparkR:::saveAsTextFile(dfsMapKey, "yieldTesting")

0 个答案:

没有答案