在 ggplot 中手动重新排序每个分面(facet)内的 x 轴标签

时间:2017-05-09 16:18:09

标签: r ggplot2 dplyr

我正在尝试手动重新排序每个分面(facet)内的 x 轴标签。

数据如下:

# Example data, as produced by dput(): a tibble with 35 rows and the columns
# block, item, response, n and freq.
#   block    - factor with levels "1".."5"; each block has 7 rows.
#   item     - factor with 32 levels; some items occur in more than one block.
#   response - factor with levels "2" and "1"; every row holds the level "1".
#   n        - integer value per row.
#   freq     - numeric value per row; this is what the plots put on the y axis.
df = structure(list(block = structure(c(1L, 1L, 1L, 1L, 1L, 1L, 1L, 
2L, 2L, 2L, 2L, 2L, 2L, 2L, 3L, 3L, 3L, 3L, 3L, 3L, 3L, 4L, 4L, 
4L, 4L, 4L, 4L, 4L, 5L, 5L, 5L, 5L, 5L, 5L, 5L), .Label = c("1", 
"2", "3", "4", "5"), class = "factor"), item = structure(c(14L, 
15L, 28L, 29L, 30L, 31L, 32L, 15L, 16L, 17L, 18L, 19L, 20L, 21L, 
15L, 22L, 23L, 24L, 25L, 26L, 27L, 1L, 2L, 3L, 4L, 5L, 6L, 7L, 
1L, 8L, 9L, 10L, 11L, 12L, 13L), .Label = c("p00e00d00", "p00e00d11", 
"p00e00d12", "p00e00d13", "p00e00d21", "p00e00d22", "p00e00d23", 
"p00e11d00", "p00e12d00", "p00e13d00", "p00e21d00", "p00e22d00", 
"p00e23d00", "p01e00d00", "p11e00d00", "p11e00d11", "p11e00d12", 
"p11e00d13", "p11e00d21", "p11e00d22", "p11e00d23", "p11e11d00", 
"p11e12d00", "p11e13d00", "p11e21d00", "p11e22d00", "p11e23d00", 
"p12e00d00", "p13e00d00", "p14e00d00", "p21e00d00", "p22e00d00"
), class = "factor"), response = structure(c(2L, 2L, 2L, 2L, 
2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 
2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L, 2L), .Label = c("2", 
"1"), class = "factor"), n = c(345L, 511L, 583L, 613L, 612L, 
222L, 142L, 531L, 546L, 589L, 636L, 478L, 364L, 313L, 502L, 533L, 
587L, 603L, 385L, 298L, 263L, 518L, 546L, 563L, 593L, 435L, 351L, 
310L, 478L, 579L, 629L, 646L, 357L, 307L, 230L), freq = c(0.408284023668639, 
0.604733727810651, 0.689940828402367, 0.725443786982249, 0.724260355029586, 
0.262721893491124, 0.168047337278107, 0.628402366863905, 0.646153846153846, 
0.697041420118343, 0.752662721893491, 0.565680473372781, 0.430769230769231, 
0.370414201183432, 0.594082840236686, 0.630769230769231, 0.694674556213018, 
0.713609467455621, 0.455621301775148, 0.352662721893491, 0.311242603550296, 
0.61301775147929, 0.646153846153846, 0.666272189349112, 0.701775147928994, 
0.514792899408284, 0.415384615384615, 0.366863905325444, 0.565680473372781, 
0.685207100591716, 0.744378698224852, 0.764497041420118, 0.422485207100592, 
0.363313609467456, 0.272189349112426)), class = c("tbl_df", "tbl", 
"data.frame"), row.names = c(NA, -35L), .Names = c("block", "item", 
"response", "n", "freq"))

共有五个块(block),每个块包含 7 个项目(item),并且某些项目在不同的块中名称相同。我可以按如下方式绘图:

# Baseline plot: one bar per item (height = freq), one facet per block.
# scales = "free" lets every facet show only its own items on the x axis.
df %>%
  ggplot(aes(x = item, y = freq)) +
  geom_bar(stat = "identity", position = "dodge", color = "black") +
  facet_grid(. ~ block, scales = "free") +
  # expand = FALSE disables the default padding around the axis limits, so
  # the y axis spans exactly 0 to 1.
  coord_cartesian(ylim = c(0, 1), expand = FALSE) +
  scale_y_continuous(labels = scales::percent) +
  theme(axis.text.x = element_text(angle = 45, hjust = 1, vjust = 1))

我还有向量,为每个块指出项目应该出现的顺序。例如:

# Desired left-to-right order of the items within block 3 and block 4.
# (The unmatched closing parentheses that followed each vector were syntax
# errors and have been removed.)
block_3_order <- c(
  "p11e13d00", "p11e12d00", "p11e11d00", "p11e00d00",
  "p11e21d00", "p11e22d00", "p11e23d00"
)
block_4_order <- c(
  "p00e00d13", "p00e00d12", "p00e00d11", "p00e00d00",
  "p00e00d21", "p00e00d22", "p00e00d23"
)

我尝试过重新排序"item"因子,但要得到想要的效果,我需要把数据框拆分成代表各个块的子集。否则,我想不出如何把按块的因子排序与 ggplot 将 item 视为单一因子的处理方式结合起来。

非常感谢任何帮助。

1 个答案:

答案 0 :(得分:3)

要让每个分面(facet)拥有不同的自定义坐标轴顺序,可以把每个"分面"创建为一个单独的图,然后将它们拼在一起,使其看起来像一张分面图。

# tidyverse supplies the pipe, the dplyr verbs, purrr's map helpers and ggplot2.
library(tidyverse)
# egg provides ggarrange(); it can be installed from GitHub with:
#devtools::install_github("baptiste/egg")
library(egg)
# gridExtra provides arrangeGrob(); grid provides textGrob(), grid.newpage()
# and grid.draw().
library(gridExtra)
library(grid)
# Make the black-and-white theme the default for every plot created below.
theme_set(theme_bw())

首先,创建自定义排序。值为 NULL 的块在最终的图中会按字母顺序排序。

# Custom item order per block, in block order. A NULL entry means the block
# has no custom order.
b.order <- list(
  b1 = NULL,
  b2 = NULL,
  b3 = c(
    "p11e13d00",
    "p11e12d00",
    "p11e11d00",
    "p11e00d00",
    "p11e21d00",
    "p11e22d00",
    "p11e23d00"
  ),
  b4 = c(
    "p00e00d13",
    "p00e00d12",
    "p00e00d11",
    "p00e00d00",
    "p00e00d21",
    "p00e00d22",
    "p00e00d23"
  ),
  b5 = NULL
)

创建一个图的列表,每个 block 对应一个图。我们通过按 block 拆分 df 来实现这一点。为了得到自定义排序,我们使用 factor 并根据列表 b.order 设置自定义的水平(levels)顺序。

# Build one single-facet plot per block. split() yields the per-block data in
# block order, and b.order supplies the matching custom item order (or NULL)
# by position.
plist <- map2(
  split(df, df$block), b.order,
  function(block_df, item_order) {
    # NULL means "no custom order": use the items present in this block,
    # sorted by their existing factor-level order.
    item_levels <- if (is.null(item_order)) {
      as.character(sort(unique(block_df$item)))
    } else {
      item_order
    }

    # An item that is absent from the custom order would silently turn into
    # NA when the factor is rebuilt, so fail loudly instead.
    unlisted <- setdiff(as.character(block_df$item), item_levels)
    if (length(unlisted) > 0) {
      stop(
        "Custom order does not cover item(s): ",
        paste(unlisted, collapse = ", "),
        call. = FALSE
      )
    }

    # The data is already restricted to a single block by split(), so no
    # group_by() is needed before re-levelling the factor.
    block_df %>%
      mutate(item = factor(item, levels = item_levels)) %>%
      ggplot(aes(x = item, y = freq)) +
      geom_bar(stat = "identity", position = "dodge", color = "black") +
      # Faceting on the single block keeps the strip label with the block id.
      facet_grid(. ~ block, scales = "free") +
      # expand = FALSE disables the default padding around the axis limits.
      coord_cartesian(ylim = c(0, 1), expand = FALSE) +
      scale_y_continuous(labels = scales::percent) +
      theme(
        axis.text.x = element_text(angle = 45, hjust = 1, vjust = 1),
        plot.margin = margin(b = -5)
      ) +
      labs(x = "")
  }
)

从除最左边的图以外的所有图中删除 y 轴标签、标题和刻度:

# Remove the y-axis text, title and ticks from every plot except the first
# (left-most) one. Negative indexing is used instead of 2:length(plist)
# because that sequence becomes c(2, 1) when plist holds a single plot.
plist[-1] <- map(
  plist[-1],
  function(panel_plot) {
    panel_plot +
      theme(
        axis.text.y = element_blank(),
        axis.title.y = element_blank(),
        axis.ticks.y = element_blank()
      )
  }
)

排列各个图。我们使用 egg 包中的 ggarrange 来确保各绘图面板具有相同的水平宽度。我们还需要在图的下方添加 Item 标签。但是,即使在 arrangeGrob 内部调用,ggarrange 也会把图绘制到输出设备上。因此,我们先创建对象 p,清空设备,然后重新绘制最终的图。

# Lay the per-block plots out side by side in one row and stack an "Item"
# text label underneath; the 20:1 heights give almost all of the space to
# the plots.
p <- arrangeGrob(
  ggarrange(
    plots = plist,
    ncol = length(plist)
  ),
  textGrob("Item"),
  heights = c(20, 1)
)

# Start a fresh page, then draw the combined layout.
grid.newpage()
grid.draw(p)

enter image description here