我是一名记者,致力于绘制2002年至2012年间黑人农民数量增加或减少的县的地图。我使用R(3.2.3)来处理和绘制数据。
我已经能够将单一颜色的整个县级收益和损失 - 从负40到正165 - 映射到单一颜色,但这使得很难看到收益和损失的模式。我想要做的是使损失变为单一颜色(例如,蓝色)的所有变化,并在第二种颜色(例如,红色)的变化中呈现增益。
以下代码为看到正面和负面变化的县生成两个单独的(非常简化的)地图。任何人都知道如何在一张地图上以两种颜色捕获这些信息?理想情况下,县与#34;差异"值0将显示为灰色。谢谢你看这个!
df <- data.frame(GEOID = c("45001", "22001", "51001", "21001", "45003"),
Difference = c(-10, -40, 150, 95, 20))
#Second part: built a shapefile and join.
counties <- readOGR(dsn="Shapefile", layer="cb_2015_us_county_5m")
#Join the data about farmers to the spatial data.
counties@data <- left_join(counties@data, df)
#NAs are not permitted in qtm method, so let's replace them with zeros.
counties$Difference[is.na(counties$Difference)] <- 0
#Here are the counties that lost black farmers.
loss.counties <- counties[counties$Difference < 0, ]
qtm(loss.counties, "Difference")
#Here are the counties that gained black farmers.
gain.counties <- counties[counties$Difference > 0, ]
qtm(gain.counties, "Difference")
答案 0 :(得分:2)
使用原始帖子中的源数据,以上是我在上面评论中建议使用ggplot
的解决方案。
library(ggplot2)
library(ggmap)
library(maps)
library(dplyr)
# get data from
# https://quickstats.nass.usda.gov/results/A68E27D5-E9B2-3621-8F1E-58829A551F32
df <- read.csv("nass_data.csv")
df$County <- tolower(df$County)
df$State <- tolower(df$State)
#Calculate the difference between the 2002 and 2012 census95,
df <- df %>%
filter(Domain == "TOTAL", Year == 2002 | Year == 2012) %>%
group_by(County) %>%
mutate(Difference = ifelse(is.na(Value-lag(Value)), 0, Value-lag(Value))) %>%
select(County, State, Difference)
#get map data for US counties and states
county_map <- map_data("county")
county_map$County <- county_map$subregion
county_map$State <- county_map$region
#Join the data about farmers to the spatial data.
county_map <- left_join(county_map, df)
#plot using ggplot
ggplot(county_map, aes(x = long, y = lat, group=group)) +
geom_polygon(aes(fill = Difference)) +
scale_fill_gradient2(midpoint = 0, mid="#eee8d5", high="#dc322f", low="#268bd2")
答案 1 :(得分:2)
将这些数据包装起来可能更好。我快速判断了垃圾箱应该是什么,你应该查看数据,看它是否应该是不同的。我也非常手动地进行了分组,以试图显示正在进行的操作。
使用FIPS代码(&#34; ANSI&#34;列的组合)可以在县名难以匹配的情况下提供帮助,因此我为什么要这样做。
人们倾向于忽略AK&amp;嗨,但似乎有一些农场。
此外,红色/蓝色是加载颜色,确实应该避免。
library(ggplot2)
library(maps)
library(maptools)
library(rgeos)
library(albersusa) # devtools::install_github("hrbrmstr/albersusa")
library(ggalt)
library(ggthemes)
library(dplyr)
df <- read.csv("347E31A8-7257-3AEE-86D3-4BE3D08982A3.csv")
df <- df %>%
filter(Domain == "TOTAL", Year == 2002 | Year == 2012) %>%
group_by(County) %>%
mutate(delta=Value-lag(Value),
delta=ifelse(is.na(delta), 0, delta),
fips=sprintf("%02d%03d", State.ANSI, County.ANSI))
df$delta <- cut(df$delta, include.lowest=FALSE,
breaks=c(-400, -300, -200, -100, -1, 1, 100, 200, 300, 400),
labels=c("301 to 400 (losses)", "201 to 300", "101 to 200", "1 to 100",
"no gains/losses",
"+1 to 100", "+101 to 200", "+201 to 300", "301 to 400 (gains)"))
counties <- counties_composite()
counties_map <- fortify(counties, region="fips")
gg <- ggplot()
gg <- gg + geom_map(data=counties_map, map=counties_map,
aes(x=long, y=lat, map_id=id),
color="#b3b3b3", size=0.15, fill="white")
gg <- gg + geom_map(data=df, map=counties_map,
aes(fill=delta, map_id=fips),
color="#b3b3b3", size=0.15)
gg <- gg + scale_fill_manual(name="Change since 2002\n(white = no data)",
values=c("#543005", "#8c510a", "#bf812d", "#dfc27d",
"#e0e0e0",
"#80cdc1", "#35978f", "#01665e", "#003c30"),
guide=guide_legend(reverse=TRUE))
gg <- gg + coord_proj(us_laea_proj)
gg <- gg + labs(x="Grey == no data", y=NULL)
gg <- gg + theme_map()
gg <- gg + theme(legend.position=c(0.85, 0.2))
gg <- gg + theme(legend.key=element_blank())
gg