r - 将 ggplot2 对象中的图例名称从小到大排序
问题描述
我有下面的数据框,我想将图例名称按从小到大的顺序排列。
这些值可能是字符型,但它们与 `Cases` 列相对应——我认为这一点可能有用,因为数据集是动态的。
# Example data: case counts per age group and gender, with pre-formatted
# labels (`lab`, `lab2`), the per-age-group total, and a fill colour / Range
# bucket for every row. Columns whose values repeat in pairs are built with
# rep(); the rest are spelled out row by row.
Cum <- data.frame(
  Age.group = rep(
    c("00-04", "05-14", "15-24", "25-49", "50-64", "65-79", "80+"),
    each = 2
  ),
  Gender = rep(c("Female", "Male"), times = 7),
  Cases = c(
    64578, 70518,
    187568, 197015,
    414405, 388138,
    1342394, 1206168,
    792180, 742744,
    400232, 414613,
    282268, 198026
  ),
  lab = c(
    "64,578", "70,518",
    "187,568", "197,015",
    "414,405", "388,138",
    "1,342,394", "1,206,168",
    "792,180", "742,744",
    "400,232", "414,613",
    "282,268", "198,026"
  ),
  Age.group.Sum = rep(
    c(135096, 384583, 802543, 2548562, 1534924, 814845, 480294),
    each = 2
  ),
  lab2 = rep(
    c(
      "135,096", "384,583", "802,543", "2,548,562",
      "1,534,924", "814,845", "480,294"
    ),
    each = 2
  ),
  color = c(
    "#4285f4", "#4285f4",
    "#90a9e0", "#90a9e0",
    "#dd9e5f", "#dd9e5f",
    "#b45f06", "#b45f06",
    "#b45f06", "#b45f06",
    "#dd9e5f", "#dd9e5f",
    "#aebbd6", "#90a9e0"
  ),
  Range = c(
    "LESS THAN 74.5K", "LESS THAN 74.5K",
    "148.9K - 223.4K", "148.9K - 223.4K",
    "372.3K - 446.7K", "372.3K - 446.7K",
    "MORE THAN 670.1K", "MORE THAN 670.1K",
    "MORE THAN 670.1K", "MORE THAN 670.1K",
    "372.3K - 446.7K", "372.3K - 446.7K",
    "223.4K - 297.8K", "148.9K - 223.4K"
  ),
  # Keep every text column as character, as in the original literal.
  stringsAsFactors = FALSE
)
# `mycols` is not defined anywhere in this snippet. Only self-name it when it
# has been created elsewhere, so the script does not stop with
# "object 'mycols' not found".
if (exists("mycols")) {
  names(mycols) <- mycols
}
# Presumably intended as y-axis break values; not referenced by the plotting
# code shown in this snippet.
ylab <- c(0.5, 1, 1.5, 2, 2.5)
# Named fill palette for scale_fill_manual(): one colour per distinct Range
# label. The colour is taken from the first row carrying each label, so colour
# and label are paired by row rather than by the coincidental order of two
# independent unique() calls.
lbls <- with(Cum[!duplicated(Cum$Range), ], setNames(color, Range))
# Dodged bar chart of Cases per age group, one bar per Gender, filled by the
# Range bucket using the named palette `lbls`.
# ggplot2 is attached here and unit_format() is namespace-qualified so the
# snippet runs without relying on packages attached elsewhere.
library(ggplot2)

ggplot_obj <- ggplot(
  data = Cum,
  aes(x = Age.group, y = Cases, group = Gender, fill = Range)
) +
  # geom_col() is the direct form of geom_bar(stat = "identity").
  geom_col(
    aes(
      # `text` is not a ggplot2 aesthetic; presumably it is consumed as an
      # HTML tooltip by plotly::ggplotly() -- TODO confirm.
      text = paste(
        "<b>Gender:</b>", Gender, "<br><b>Age:</b>", Age.group,
        "<br><b>Cases:</b>", lab, "<br><b>Total cases in age group:</b>",
        lab2
      )
    ),
    position = "dodge"
  ) +
  # Gender label anchored slightly above the top of each dodged bar.
  geom_text(
    aes(y = Cases + 10000, label = Gender),
    vjust = 1,
    position = position_dodge(width = 0.9),
    size = 2
  ) +
  scale_fill_manual(values = lbls) +
  # Start the y axis at 0 and leave 10% headroom above the tallest bar.
  coord_cartesian(ylim = c(0, max(Cum$Cases) * 1.1), expand = FALSE) +
  theme_bw() +
  theme(
    # remove the vertical grid lines
    panel.grid.major.x = element_blank(),
    panel.border = element_blank(),
    axis.line.x = element_line()
  ) +
  # Label the y axis in millions (values scaled by 1e-6, unit "M").
  scale_y_continuous(labels = scales::unit_format(unit = "M", scale = 1e-6)) +
  xlab("Age group")
解决方案
我们可以将该列转换为 `factor`,并按自定义顺序指定其 `levels`:
# Fix the legend order by turning Range into a factor whose levels are listed
# explicitly, from the smallest bucket to the largest.
Cum[["Range"]] <- factor(
  Cum[["Range"]],
  levels = c(
    "LESS THAN 74.5K",
    "148.9K - 223.4K",
    "223.4K - 297.8K",
    "372.3K - 446.7K",
    "MORE THAN 670.1K"
  )
)
# 0.5, 1, 1.5, 2, 2.5
ylab <- seq_len(5) / 2
# Palette in level order: for each level, take the colour of the first row
# that carries it, and name the colour with that level.
lbls <- structure(
  Cum[["color"]][match(levels(Cum[["Range"]]), Cum[["Range"]])],
  names = levels(Cum[["Range"]])
)
然后使用 OP 的原始代码构建 `ggplot` 图形即可。
-输出
更新
如果 `Range` 的值是动态的(假设单位相同),可以用 `parse_number` 提取其中的数字部分,按该数字进行 `order` 排序,再取 `unique` 值作为因子的 levels:
# Derive the level order from the data itself: sort the Range labels by the
# first number readr::parse_number() finds in each, then keep each label once.
lvls <- local({
  range_chr <- as.character(Cum$Range)
  unique(range_chr[order(readr::parse_number(range_chr))])
})
Cum[["Range"]] <- factor(Cum[["Range"]], levels = lvls)
或者,另一种选择是按 `Cases` 列进行 `arrange` 排序,然后按排序后出现的先后顺序设置 `Range` 的 levels:
library(dplyr)
# Sort rows by ascending Cases (ties broken by Age.group), then make Range a
# factor whose levels follow the order in which labels first appear in the
# sorted rows.
Cum <- arrange(Cum, Cases, Age.group)
Cum <- mutate(Cum, Range = factor(Range, levels = unique(Range)))
# Palette in level order: colour of the first row carrying each level, named
# by that level.
lbls <- structure(
  Cum[["color"]][match(levels(Cum[["Range"]]), Cum[["Range"]])],
  names = levels(Cum[["Range"]])
)
推荐阅读
- flutter - PUB_HOSTED_URL 的默认值 FLUTTER_STORAGE_BASE_URL
- java - Wildfly 上的 Multipart/form-data RESTEasy 错误
- php - php通过sftp发送文件到ipv6主机
- python - 从音品号、弦号和拾音器设置中查找低音吉他的音高
- angular - 带有 ref 过滤器的 AngularFireList 删除所有项目而不是过滤
- python - 根据开始时间和结束时间之间的差异生成行(分钟)
- reactjs - React Bootstrap - 在路线更改时关闭 NavDropdown
- java - Java Spring Hibernate JPA PostgreSQL 避免保存重复的行/记录
- asp.net-mvc - 当从 iframe 为 SSO azure B2C msal .net 生成令牌时,为什么 Request.IsAuthenticated 为假
- r - R,sf 包:缓冲区和点未显示在地图上