使用facet_grid

时间:2018-05-24 15:38:13

标签: r plot ggplot2 geom-bar facet-grid

我长期以来一直坚持这个问题。基本上我需要在二维facet_grid中生成细菌分类群的堆积条形图。这不是问题 - 但是,我确实需要使用2个不同的x轴标签图。

我看过这些有用的线程,但仍然不满意:

Force x-axis labels on facet_grid ggplot: drop lables

Force x-axis labels on facet_grid ggplot: x-axis labels differ per row

Force X axis text on for all facets of a facet_grid plot

我的第一个数据框:

structure(list(variable = structure(c(1L, 1L, 1L, 15L, 15L, 15L, 
8L, 8L, 8L, 14L, 14L, 14L, 11L, 11L, 11L, 6L, 6L, 6L, 9L, 9L, 
9L, 2L, 2L, 2L, 4L, 4L, 4L, 13L, 13L, 13L, 12L, 12L, 12L, 10L, 
10L, 10L, 3L, 3L, 3L, 7L, 7L, 7L, 5L, 5L, 5L), .Label = c("Control-5C10-7F", 
"Control-5C20-7M", "Treatment-5T16-7M", "Treatment-5T10-7F", 
"Treatment-5T20-7F", "Control-5C18-7F", "Treatment-5T17-7F", 
"Control-5C11-7F", "Control-5C19-7M", "Treatment-5T16-7F", "Control-5C17-7F", 
"Treatment-5T11-7M", "Treatment-5T10-7M", "Control-5C11-7M", 
"Control-5C10-7M"), class = "factor"), value = c(0.331838128419, 
0.352404886374, 0.0718854601356, 0.354207630618, 0.294475795902, 
0.0531792027053, 0.29236332445, 0.468273675353, 0.0607016856192, 
0.293872306838, 0.362196681338, 0.066892937885, 0.365593390631, 
0.307405564259, 0.0440421535284, 0.355757725414, 0.344565656834, 
0.0385728714381, 0.321804993859, 0.357477936005, 0.0189435852408, 
0.29485205349, 0.323279812948, 0.0613479971185, 0.330899082108, 
0.0950818222943, 0.00477515444166, 0.382399029908, 0.118943005246, 
0.00476898392234, 0.369726433283, 0.163932867784, 0.00531688661114, 
0.309218704951, 0.146836936202, 0.196198995646, 0.395112160831, 
0.185072972204, 0.00267743643869, 0.306483893184, 0.330640754636, 
0.0715509081212, 0.301275805191, 0.388917814857, 0.0356065705157
), Type = structure(c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 
1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 1L, 2L, 2L, 
2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 
2L, 2L, 2L), .Label = c("Control", "Treatment"), class = "factor"), 
    Time.Sex = structure(c(2L, 2L, 2L, 1L, 1L, 1L, 2L, 2L, 2L, 
    1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 1L, 1L, 1L, 1L, 1L, 1L, 
    2L, 2L, 2L, 1L, 1L, 1L, 1L, 1L, 1L, 2L, 2L, 2L, 1L, 1L, 1L, 
    2L, 2L, 2L, 2L, 2L, 2L), .Label = c("7d.M", "7d.F"), class = "factor"), 
    IndividualID = c("5C10", "5C10", "5C10", "5C10", "5C10", 
    "5C10", "5C11", "5C11", "5C11", "5C11", "5C11", "5C11", "5C17", 
    "5C17", "5C17", "5C18", "5C18", "5C18", "5C19", "5C19", "5C19", 
    "5C20", "5C20", "5C20", "5T10", "5T10", "5T10", "5T10", "5T10", 
    "5T10", "5T11", "5T11", "5T11", "5T16", "5T16", "5T16", "5T16", 
    "5T16", "5T16", "5T17", "5T17", "5T17", "5T20", "5T20", "5T20"
    ), Sex = c("F", "F", "F", "M", "M", "M", "F", "F", "F", "M", 
    "M", "M", "F", "F", "F", "F", "F", "F", "M", "M", "M", "M", 
    "M", "M", "F", "F", "F", "M", "M", "M", "M", "M", "M", "F", 
    "F", "F", "M", "M", "M", "F", "F", "F", "F", "F", "F"), Rep = c(1, 
    1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 3, 3, 3, 4, 4, 4, 3, 3, 
    3, 4, 4, 4, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 3, 3, 3, 
    3, 3, 3, 4, 4, 4), IndividualID.Sex = c("5C10.F", "5C10.F", 
    "5C10.F", "5C10.M", "5C10.M", "5C10.M", "5C11.F", "5C11.F", 
    "5C11.F", "5C11.M", "5C11.M", "5C11.M", "5C17.F", "5C17.F", 
    "5C17.F", "5C18.F", "5C18.F", "5C18.F", "5C19.M", "5C19.M", 
    "5C19.M", "5C20.M", "5C20.M", "5C20.M", "5T10.F", "5T10.F", 
    "5T10.F", "5T10.M", "5T10.M", "5T10.M", "5T11.M", "5T11.M", 
    "5T11.M", "5T16.F", "5T16.F", "5T16.F", "5T16.M", "5T16.M", 
    "5T16.M", "5T17.F", "5T17.F", "5T17.F", "5T20.F", "5T20.F", 
    "5T20.F"), Genus = c("o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group", 
    "o__Bacteroidales;g__Parabacteroides", "o__Lactobacillales;g__Lactobacillus", 
    "o__Clostridiales;g__Lachnospiraceae NK4A136 group", "o__Bacteroidales;g__Parabacteroides", 
    "o__Lactobacillales;g__Lactobacillus", "o__Clostridiales;g__Lachnospiraceae NK4A136 group"
    ), variable2 = c("7d.F-1", "7d.F-1", "7d.F-1", "7d.M-1", 
    "7d.M-1", "7d.M-1", "7d.F-2", "7d.F-2", "7d.F-2", "7d.M-2", 
    "7d.M-2", "7d.M-2", "7d.F-3", "7d.F-3", "7d.F-3", "7d.F-4", 
    "7d.F-4", "7d.F-4", "7d.M-3", "7d.M-3", "7d.M-3", "7d.M-4", 
    "7d.M-4", "7d.M-4", "7d.F-1", "7d.F-1", "7d.F-1", "7d.M-1", 
    "7d.M-1", "7d.M-1", "7d.M-2", "7d.M-2", "7d.M-2", "7d.F-2", 
    "7d.F-2", "7d.F-2", "7d.M-3", "7d.M-3", "7d.M-3", "7d.F-3", 
    "7d.F-3", "7d.F-3", "7d.F-4", "7d.F-4", "7d.F-4"), pos = c(0.1, 
    0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 
    0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.2, 
    0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 
    0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2, 0.2)), .Names = c("variable", 
"value", "Type", "Time.Sex", "IndividualID", "Sex", "Rep", "IndividualID.Sex", 
"Genus", "variable2", "pos"), row.names = c(NA, -45L), class = "data.frame")

ggplot内部函数中使用的第二个数据框。

structure(list(variable2 = c("7d.F-1", "7d.M-1", "7d.F-2", "7d.M-2", 
"7d.F-3", "7d.F-4", "7d.M-3", "7d.M-4", "7d.F-1", "7d.M-1", "7d.M-2", 
"7d.F-2", "7d.M-3", "7d.F-3", "7d.F-4"), IndividualID = c("5C10", 
"5C10", "5C11", "5C11", "5C17", "5C18", "5C19", "5C20", "5T10", 
"5T10", "5T11", "5T16", "5T16", "5T17", "5T20"), Type = structure(c(1L, 
1L, 1L, 1L, 1L, 1L, 1L, 1L, 2L, 2L, 2L, 2L, 2L, 2L, 2L), .Label = c("Control", 
"Treatment"), class = "factor")), .Names = c("variable2", "IndividualID", 
"Type"), row.names = c(1L, 4L, 7L, 10L, 13L, 16L, 19L, 22L, 25L, 
28L, 31L, 34L, 37L, 40L, 43L), class = "data.frame")

我的代码:

index_x <<-  0
index_k <<-  0
p <- ggplot(data=df, aes(x=variable2, y=value, fill=Genus)) +
   facet_grid("Type ~ Time.Sex", scales="free_x", space="free_x") +
   geom_bar(stat="identity", size=0.0) +
   geom_bar( size=0.0, stat="identity", show.legend=FALSE) +
##I tried with some level of success to include the labels I want inside the stacked bars themselves, but 
   ## would ideally like them to be on the x-axis.
   geom_text(aes(y=pos, label=IndividualID), vjust=0, angle=90, size=3) +
   xlab("Category") +
   ylab("Abundance %") +
   ggtitle(paste0("Taxa abundance")) +
   theme(
      panel.border=element_rect(fill=NA, linetype="solid", colour = "black", size=0.25),
      axis.text.x=element_text(size=9, colour="black", angle=as.numeric(90)),
      axis.text.y=element_text(size=9, colour="black"),
      axis.title=element_text(family="Helvetica", size=10),
      plot.title = element_text(lineheight=1.2, face="bold", size=25),
      panel.grid.major=element_blank(),
      panel.grid.minor=element_blank(),
      panel.background=element_blank(),
      legend.key.size = unit(0.35, "cm"),
      legend.text = element_text(size=12, face="bold"),
      legend.title = element_text(size=12, face="bold"),
      legend.spacing = unit(1, "cm"),
      legend.position="right",
      strip.text.x = element_text(angle=90, vjust=0, size=7, face="bold"),
      strip.text.y = element_text(hjust=0, angle=0, size=7, face="bold"),
      strip.background =  element_blank(),
      panel.spacing.y = unit(0.3, "lines")
   ) +  scale_fill_manual(values=vColors) +
   ## I wrote an internal function to force the x labels
   scale_x_discrete(name="IndividualID", labels = function(x){

      final_labels = c()

      if(index_x %% length(curr_order_x) == 0){
         index_k <<- index_k + 1
      }
      df_labels2 = df_labels_orig[df_labels_orig[[ facets[1] ]] == rev(curr_order_y)[index_k], ]

      for(i in 1:length(x)){
         final_labels = c(final_labels, df_labels2[df_labels2$variable2 == x[i],]$IndividualID)
      }
      index_x <<- index_x + 1

      print(final_labels)
      return(final_labels)
   }  
   )
print(p)

我得到以下内容: Obtained stacked barplot 但我想要的是在x轴上位于堆叠条中的个体ID。所以这就是我所做的,以为我可以使用gTable从上面的内部函数中显示强制x轴标签。

# Then following the references I found on SO, I tried the following:
index_x <<- 0 
index_k <<- 0

g <- ggplotGrob(p)

panels <- grep("panel", g$layout$name)
top <- unique(g$layout$t[panels])

top.row <- gtable:::rbind_gtable(
   g[seq.int(min(top)), ],
   g[max(top)+1,], "first"
)
bottom.row <- g[(max(top)-1):nrow(g), ]
all <- gtable:::rbind_gtable(top.row, bottom.row, "first")
grid.newpage()
grid.draw(all)

我获得了: stacked barplot with gTable x轴在两行上是相同的,我希望它们与它们实际代表的对应。它似乎适用于底部面板,但上面板x轴标签包含与下面板上的标签相同的标签。我也失去了传奇。

编辑:这是我想要的最终结果: Desired figure

1 个答案:

答案 0 :(得分:1)

不要调整到facet_grid的设置,而是考虑根据所需的分组单独构建绘图。具体来说,考虑基础R by(根据因子对数据框进行切片),根据您的级别类型时间来构建一个图表列表。性

但是,需要进行调整以满足您的要求:

  1. 控制图放在治疗图上方;
  2. 调整轴以避免冗余(根据实际的绘图数量,此处为4):
    • 删除第2和第4位的y轴标题/文字/刻度;
    • 删除第1和第2图上的x轴标题;
  3. 使用@baptist's share a legend方法避免使用多个图例。
  4. 分享图例 (已调整为在第一个参数的图表列表中读取并在顶部添加标题)

    # CREDIT: @Baptist: https://github.com/tidyverse/ggplot2/wiki/Share-a-legend-between-two-ggplot2-graphs
    grid_arrange_shared_legend <- function(plots, ncol = length(list(...)), nrow = 1, position = c("bottom", "right")) {
    
      position <- match.arg(position)
      g <- ggplotGrob(plots[[1]] + theme(legend.position = position))$grobs
      legend <- g[[which(sapply(g, function(x) x$name) == "guide-box")]]
      lheight <- sum(legend$height)
      lwidth <- sum(legend$width)
      gl <- lapply(plots, function(x) x + theme(legend.position="none"))
      gl <- c(gl, ncol = ncol, nrow = nrow)
    
      title <- textGrob("Taxa Abundance",gp=gpar(fontsize=20))
    
      combined <- switch(position,
                         "bottom" = arrangeGrob(do.call(arrangeGrob, gl),
                                                legend,
                                                ncol = 1,
                                                top = title,
                                                heights = unit.c(unit(0.95, "npc") - lheight, lheight)),
                         "right" = arrangeGrob(do.call(arrangeGrob, gl),
                                               legend,
                                               ncol = 2,
                                               widths = unit.c(unit(1, "npc") - lwidth, lwidth)))
    
      grid.newpage()
      grid.draw(combined)
    
      # return gtable invisibly
      invisible(combined)
    
    }
    

    R (使用by()图)

    vColors <- c("red", "green", "blue")
    
    by_plots <- by(df, df[,c("Type", "Time.Sex")], FUN=function(sub)       
      ggplot(sub, aes(x=IndividualID, y=value, fill=factor(Genus))) +
        geom_bar(stat="identity", size=0.0) + 
        labs(title=paste(sub$Type[[1]], "-", sub$Time.Sex[[1]]), x="Category", y="Abundance %") + 
        guides(fill=guide_legend(title="Genus", nrow=3)) + ylim(0, 0.9) +
        scale_fill_manual(values=vColors) +
        theme(plot.title = element_text(hjust = 0.5))
    )
    
    # RE-ORDER FOR CONTROL PLOTS ABOVE TREATMENT PLOTS
    by_plots <- by_plots[c(1,3,2,4)]
    
    # CONDITIONALLY REMOVE Y-AXIS AND X-AXIS TITLE    
    by_plots <- lapply(seq_along(by_plots), function(i) {
      if ((i %% 2) == 0)
        by_plots[[i]] <- by_plots[[i]] + theme(axis.title.y = element_blank(),
                                               axis.text.y = element_blank(),
                                               axis.ticks.y = element_blank())
    
      if (i < 3)
        by_plots[[i]] <- by_plots[[i]] + theme(axis.title.x = element_blank())      
    
      return(by_plots[[i]])
    })
    
    grid_arrange_shared_legend(by_plots, ncol=2, nrow=2)
    

    <强>输出

    Plot Output