不要删除 ggplot 中的 na 值
Do not remove na values in ggplot
我有一个数据框df
df<-structure(list(y = c(2268.14043972082, 2147.62290922552, 2269.1387550775,
2247.31983098201, 1903.39138268307, 2174.78291538358, 2359.51909126411,
2488.39004804939, 212.851575751527, 461.398994384333, 567.150629704352,
781.775113821961, 918.303706148872, 1107.37695799186, 1160.80594193377,
1412.61328924168, 1689.48879626486, 260.737164468854, 306.72700499362,
283.410379620422, 366.813913489692, 387.570173754128, 388.602676983443,
477.858510450125, 128.198042456082, 535.519377609133, 1028.8780498564,
1098.54431357711, 1265.26965941035, 1129.58344809909, 820.922447928053,
749.343583476846, 779.678206156474, 646.575242339517, 733.953282899613,
461.156280127354, 906.813018662913, 798.186995701282, 831.365377249207,
764.519073183124, 672.076289062505, 669.879217186302, 1341.47673353751,
1401.44881976186, 1640.27575962036), P = c(1750.51986303926,
1614.11541634798, 951.847023338079, 1119.3682884872, 1112.38984390156,
1270.65773075982, 1234.72262170166, 1338.46096616983, 1198.95775346458,
1136.69287367165, 1265.46480803983, 1364.70149818063, 1112.37006707489,
1346.49240261316, 1740.56677791104, 1410.99217295647, 1693.18871380948,
901.760176040232, 763.971046562772, 994.8699095021, 972.755147593882,
1011.41669411398, 643.705302958842, 537.54384616157, 591.212003320456,
464.405641604215, NA, NA, NA, NA, NA, 246.197052353527, 265.237238116562,
1260.68540103734, 398.080919081345, NA, 374.611004248261, 527.686996757984,
765.678002953529, 661.830007851124, 484.864011824131, 612.936006393284,
672.088483441621, 625.397994920611, 785.390003710985), x = c(49,
50, 51, 52, 53, 54, 55, 56, 1, 2, 3, 4, 5, 14, 15, 16, 17, 2,
3, 4, 5, 6, 10, 11, 3, 30, 64, 66, 67, 68, 69, 34, 35, 37, 39,
2, 17, 18, 99, 100, 102, 103, 67, 70, 72), Te = c(9.10006221322572,
7.65505467142961, 8.21480062559674, 8.09251754304318, 8.466220758789,
8.48094407814006, 8.77304120569444, 8.31727518543397, 8.14410265791868,
8.80921738865237, 9.04091478341757, 9.66233618146246, 8.77015716015164,
9.46037931956657, 9.59702379240667, 10.1739258740118, 9.39524442215692,
0.616491147620629, 0.631476354027448, 0.129135682201776, 1.87297579763483,
2.53941370394744, -0.518422834982312, 1.34466852591922, 1.05118063842584,
1.79515935418336, 6.65555189859301, 6.38647333946436, 6.48427760143803,
6.33587322941382, 7.3501870975794, 3.04366850755114, 1.94656549866681,
3.61970174782833, 4.41939287295897, 9.47923019665153, 8.87480698915229,
8.06993784515111, 2.31976094801132, 2.65270969716837, 2.21586561444892,
2.66012522311856, 5.72634186318572, 4.63445162539409, 6.18505171198551
)), .Names = c("y", "P", "x", "Te"), row.names = c(NA, -45L), class = "data.frame")
我使用 ggplot 绘制这个 y 对 x 的图,其中点的大小和颜色分别基于 T 和 P。
ggplot(df) +
geom_point(aes(x = x, y = y, size=P, colour=Te), alpha=0.7) +
scale_colour_gradient(low="#00FF33", high ="#FF0000", guide = "colourbar")+
labs(colour="T", size="P")+
xlab("x") + ylab("y")+
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour="grey", size=0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position="bottom",
legend.box="horizontal") +
guides(colour = guide_colourbar(title.position="top", title.hjust = 0.5),
size = guide_legend(title.position="top", title.hjust = 0.5))
一些点被删除了,因为我在 P 中有一些 NA 值。但是,我想保留这些点并给它们一个灰色。
有人知道怎么做吗?
一个解决方案是使用两个数据子集——第一次调用 geom_point
仅绘制 df$P
为 而非 的数据点 NA
。对 geom_point
的第二次调用绘制了 df$P
为 NA
的点,因此删除了 size = P
美学。
ggplot(df) +
geom_point(data = subset(df, !is.na(P)), aes(x = x, y = y, size=P, colour=Te), alpha=0.7) +
geom_point(data = subset(df, is.na(P)), aes(x = x, y = y, color = Te), alpha = 0.7, color = "black") +
scale_colour_gradient(low="#00FF33", high ="#FF0000", guide = "colourbar")+
labs(colour="T", size="P")+
xlab("x") + ylab("y")+
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour="grey", size=0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position="bottom",
legend.box="horizontal") +
guides(colour = guide_colourbar(title.position="top", title.hjust = 0.5),
size = guide_legend(title.position="top", title.hjust = 0.5))
注意:您可以通过在第一个 ggplot
电话。您还可以通过将所有内容放入 labs()
来减少 labs
、xlabs
和 ylabs
的一些重复。最后,gradient = "colourbar"
是 scale_colour_gradient
的 guide
参数的默认值,因此它也可以被删除:
ggplot(df, aes(x = x, y = y), alpha = 0.7) +
geom_point(data = subset(df, !is.na(P)), aes(size = P, color = Te)) +
geom_point(data = subset(df, is.na(P)), color = "black") +
scale_colour_gradient(low = "#00FF33", high = "#FF0000") +
labs(x = "x", y = "y", colour = "T", size = "P") +
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour = "grey", size = 0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position = "bottom",
legend.box = "horizontal") +
guides(colour = guide_colourbar(title.position = "top", title.hjust = 0.5),
size = guide_legend(title.position = "top", title.hjust = 0.5))
我有一个数据框df
df<-structure(list(y = c(2268.14043972082, 2147.62290922552, 2269.1387550775,
2247.31983098201, 1903.39138268307, 2174.78291538358, 2359.51909126411,
2488.39004804939, 212.851575751527, 461.398994384333, 567.150629704352,
781.775113821961, 918.303706148872, 1107.37695799186, 1160.80594193377,
1412.61328924168, 1689.48879626486, 260.737164468854, 306.72700499362,
283.410379620422, 366.813913489692, 387.570173754128, 388.602676983443,
477.858510450125, 128.198042456082, 535.519377609133, 1028.8780498564,
1098.54431357711, 1265.26965941035, 1129.58344809909, 820.922447928053,
749.343583476846, 779.678206156474, 646.575242339517, 733.953282899613,
461.156280127354, 906.813018662913, 798.186995701282, 831.365377249207,
764.519073183124, 672.076289062505, 669.879217186302, 1341.47673353751,
1401.44881976186, 1640.27575962036), P = c(1750.51986303926,
1614.11541634798, 951.847023338079, 1119.3682884872, 1112.38984390156,
1270.65773075982, 1234.72262170166, 1338.46096616983, 1198.95775346458,
1136.69287367165, 1265.46480803983, 1364.70149818063, 1112.37006707489,
1346.49240261316, 1740.56677791104, 1410.99217295647, 1693.18871380948,
901.760176040232, 763.971046562772, 994.8699095021, 972.755147593882,
1011.41669411398, 643.705302958842, 537.54384616157, 591.212003320456,
464.405641604215, NA, NA, NA, NA, NA, 246.197052353527, 265.237238116562,
1260.68540103734, 398.080919081345, NA, 374.611004248261, 527.686996757984,
765.678002953529, 661.830007851124, 484.864011824131, 612.936006393284,
672.088483441621, 625.397994920611, 785.390003710985), x = c(49,
50, 51, 52, 53, 54, 55, 56, 1, 2, 3, 4, 5, 14, 15, 16, 17, 2,
3, 4, 5, 6, 10, 11, 3, 30, 64, 66, 67, 68, 69, 34, 35, 37, 39,
2, 17, 18, 99, 100, 102, 103, 67, 70, 72), Te = c(9.10006221322572,
7.65505467142961, 8.21480062559674, 8.09251754304318, 8.466220758789,
8.48094407814006, 8.77304120569444, 8.31727518543397, 8.14410265791868,
8.80921738865237, 9.04091478341757, 9.66233618146246, 8.77015716015164,
9.46037931956657, 9.59702379240667, 10.1739258740118, 9.39524442215692,
0.616491147620629, 0.631476354027448, 0.129135682201776, 1.87297579763483,
2.53941370394744, -0.518422834982312, 1.34466852591922, 1.05118063842584,
1.79515935418336, 6.65555189859301, 6.38647333946436, 6.48427760143803,
6.33587322941382, 7.3501870975794, 3.04366850755114, 1.94656549866681,
3.61970174782833, 4.41939287295897, 9.47923019665153, 8.87480698915229,
8.06993784515111, 2.31976094801132, 2.65270969716837, 2.21586561444892,
2.66012522311856, 5.72634186318572, 4.63445162539409, 6.18505171198551
)), .Names = c("y", "P", "x", "Te"), row.names = c(NA, -45L), class = "data.frame")
我使用 ggplot 绘制这个 y 对 x 的图,其中点的大小和颜色分别基于 T 和 P。
ggplot(df) +
geom_point(aes(x = x, y = y, size=P, colour=Te), alpha=0.7) +
scale_colour_gradient(low="#00FF33", high ="#FF0000", guide = "colourbar")+
labs(colour="T", size="P")+
xlab("x") + ylab("y")+
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour="grey", size=0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position="bottom",
legend.box="horizontal") +
guides(colour = guide_colourbar(title.position="top", title.hjust = 0.5),
size = guide_legend(title.position="top", title.hjust = 0.5))
一些点被删除了,因为我在 P 中有一些 NA 值。但是,我想保留这些点并给它们一个灰色。
有人知道怎么做吗?
一个解决方案是使用两个数据子集——第一次调用 geom_point
仅绘制 df$P
为 而非 的数据点 NA
。对 geom_point
的第二次调用绘制了 df$P
为 NA
的点,因此删除了 size = P
美学。
ggplot(df) +
geom_point(data = subset(df, !is.na(P)), aes(x = x, y = y, size=P, colour=Te), alpha=0.7) +
geom_point(data = subset(df, is.na(P)), aes(x = x, y = y, color = Te), alpha = 0.7, color = "black") +
scale_colour_gradient(low="#00FF33", high ="#FF0000", guide = "colourbar")+
labs(colour="T", size="P")+
xlab("x") + ylab("y")+
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour="grey", size=0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position="bottom",
legend.box="horizontal") +
guides(colour = guide_colourbar(title.position="top", title.hjust = 0.5),
size = guide_legend(title.position="top", title.hjust = 0.5))
注意:您可以通过在第一个 ggplot
电话。您还可以通过将所有内容放入 labs()
来减少 labs
、xlabs
和 ylabs
的一些重复。最后,gradient = "colourbar"
是 scale_colour_gradient
的 guide
参数的默认值,因此它也可以被删除:
ggplot(df, aes(x = x, y = y), alpha = 0.7) +
geom_point(data = subset(df, !is.na(P)), aes(size = P, color = Te)) +
geom_point(data = subset(df, is.na(P)), color = "black") +
scale_colour_gradient(low = "#00FF33", high = "#FF0000") +
labs(x = "x", y = "y", colour = "T", size = "P") +
scale_size(range = c(3, 8)) +
theme_bw(base_size = 12, base_family = "Helvetica") +
theme(panel.grid.minor = element_line(colour = "grey", size = 0.5),
axis.text.x = element_text(angle = 45, hjust = 1),
legend.position = "bottom",
legend.box = "horizontal") +
guides(colour = guide_colourbar(title.position = "top", title.hjust = 0.5),
size = guide_legend(title.position = "top", title.hjust = 0.5))