1、两个变量:x,y皆连续
使用数据集mtcars
mtcars数据集包含从1974年《美国汽车趋势》杂志中提取的数据,该数据描述了32辆汽车(1973–74年型号)的油耗以及汽车设计和性能的10个其他属性。
data:image/s3,"s3://crabby-images/0245e/0245e6cd618700411671b19e236c8d1c4baddbf5" alt=""
#先创建一个ggplot图层
library(ggplot2)
b <- ggplot(data = mtcars, aes(x=wt, y=mpg))
#DatistEQ回收数据,后续代码省略此行
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
可能添加的图层有:
- geom_point():散点图
- geom_smooth():平滑线
- geom_quantile():分位线
- geom_rug():边际地毯线
- geom_jitter():避免重叠
- geom_text():添加文本注释
data:image/s3,"s3://crabby-images/0d106/0d1068ea1cb5192583dd1e92e4245fd5bfb13b58" alt=""
1.1 散点图
b+geom_point()
data:image/s3,"s3://crabby-images/789f6/789f613d2c31a683646ab6584a0a94091918d950" alt=""
将变量cyl映射给点的颜色和形状
b + geom_point(aes(color = factor(cyl), shape = factor(cyl)))
data:image/s3,"s3://crabby-images/60103/60103d7e2f3143ab3184a3c8488c80a77454b0e9" alt=""
自定义颜色
b+geom_point(aes(color=factor(cyl), shape=factor(cyl)))+
scale_color_manual(values=c("#999999", "#E69F00", "#56B4E9"))+theme_classic()
data:image/s3,"s3://crabby-images/7e48f/7e48f1b7af1e21c90768cfcdd3d1673b001f562d" alt=""
1.2 平滑线
可以添加回归曲线
b+geom_smooth()
data:image/s3,"s3://crabby-images/96ea1/96ea18d117cf7d715d6dbd78d0c40253cb15135d" alt=""
散点图+回归线
b+geom_point()+
geom_smooth(method = "lm", se=FALSE)#去掉置信区间
data:image/s3,"s3://crabby-images/1375d/1375de5c3a38973ab4d5dd8398c66736baf00af4" alt=""
使用loess方法
b+geom_point()+
geom_smooth(method = "loess")
data:image/s3,"s3://crabby-images/67ccb/67ccbb25c6bc077dca40352b1ace259ac0f0cf09" alt=""
将变量映射给颜色和形状
b+geom_point(aes(color=factor(cyl), shape=factor(cyl)))+
geom_smooth(aes(color=factor(cyl), shape=factor(cyl)), method = "lm", se=FALSE, fullrange=TRUE)
data:image/s3,"s3://crabby-images/fa2a6/fa2a6811b84217dee6c9a2fff236f433735dee73" alt=""
1.3 分位线
# Package `quantreg` required for `stat_quantile`.
if (!require("quantreg")) install.packages("quantreg")
ggplot(data = mpg, aes(cty, hwy))+
geom_point()+geom_quantile()+
theme_minimal()
data:image/s3,"s3://crabby-images/43f77/43f7733fbbaac8649fe4e4404163cf6b1984f4e8" alt=""
1.4 边际地毯线
使用数据集faithful
ggplot(data = faithful, aes(x=eruptions, y=waiting))+
geom_point()+geom_rug()
data:image/s3,"s3://crabby-images/7c439/7c439f1e9d1d72c9d37f36cc3526720651170bf1" alt=""
避免重叠
实际上geom_jitter()是geom_point(position="jitter")的简称,下面使用数据集mpg
p <- ggplot(data = mpg, aes(displ, hwy))
p+geom_point()
data:image/s3,"s3://crabby-images/5408c/5408cdb38554493bdb59c2418001bd6bae6deb9e" alt=""
1.5 增加抖动防止重叠
p+geom_jitter(width = 0.5, height = 0.5)
data:image/s3,"s3://crabby-images/1fdca/1fdca85540646d797494cdd287b94cf7560be342" alt=""
其中两个参数:
width:x轴方向的抖动幅度
height:y轴方向的抖动幅度
1.6 文本注释
参数label用来指定注释标签 (ggrepel可以避免标签重叠)
b+geom_text(aes(label=rownames(mtcars)))
data:image/s3,"s3://crabby-images/9ee12/9ee122c39a206087148cf98b1814bf8d7ee49c14" alt=""
完整代码如下:
header1("两个变量:x,y皆连续")
header2("散点图")
library(ggplot2)
b <- ggplot(data = mtcars, aes(x=wt, y=mpg))
b+geom_point()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将变量cyl映射给点的颜色和形状
b + geom_point(aes(color = factor(cyl), shape = factor(cyl)))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#自定义颜色
b+geom_point(aes(color=factor(cyl), shape=factor(cyl)))+
scale_color_manual(values=c("#999999", "#E69F00", "#56B4E9"))+theme_classic()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header2("平滑线")
b+geom_smooth()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#散点图+回归线
b+geom_point()+
geom_smooth(method = "lm", se=FALSE)#去掉置信区间
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#使用loess方法
b+geom_point()+
geom_smooth(method = "loess")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将变量映射给颜色和形状
b+geom_point(aes(color=factor(cyl), shape=factor(cyl)))+
geom_smooth(aes(color=factor(cyl), shape=factor(cyl)), method = "lm", se=FALSE, fullrange=TRUE)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#分位线
# Package `quantreg` required for `stat_quantile`.
if (!require("quantreg")) install.packages("quantreg")
ggplot(data = mpg, aes(cty, hwy))+ geom_point() + geom_quantile() + theme_minimal()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
ggplot(mtcars, aes(hp, disp)) +
geom_point() +
geom_quantile(quantiles = 0.5, aes(group = factor(gear), colour = factor(gear)),
xseq = min(mtcars$hp):max(mtcars$hp))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#边际地毯线
#使用数据集faithful
ggplot(data = faithful, aes(x=eruptions, y=waiting))+
geom_point()+geom_rug()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#避免重叠
#实际上geom_jitter()是geom_point(position="jitter")的简称,下面使用数据集mpg
p <- ggplot(data = mpg, aes(displ, hwy))
p+geom_point()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#增加抖动防止重叠
p+geom_jitter(width = 0.5, height = 0.5)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#文本注释
#参数label用来指定注释标签 (ggrepel可以避免标签重叠)
b <- ggplot(data = mtcars, aes(x=wt, y=mpg))
b+geom_text(aes(label=rownames(mtcars)))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
2、两个变量:连续二元分布
使用数据集diamonds,该数据集收集了约54000颗钻石的价格和质量的信息。每条记录由十个变量构成,其中有三个是名义变量,分别描述钻石的切工,颜色和净度;
注:数据集diamonds,源于ggplot2包(因为钻石的价格定价取决于重量,颜色,刀工等影响,价格该如何制定合理,为公司抢占市场制定价格提供依据。)
data:image/s3,"s3://crabby-images/266ad/266ad5bc54296d7d64d1c4aab4e2a9824f603458" alt=""
carat:克拉重量
cut:切工
color:颜色
clarity:净度
depth:深度
table:钻石宽度
以及X,Y,Z
data:image/s3,"s3://crabby-images/4e640/4e6405f4d572a059b7b826ac75ada160300906ec" alt=""
创建ggplot图层,后面再逐步添加图层
c <- ggplot(data=diamonds, aes(carat, price))
可添加的图层有:
geom_bin2d(): 二维封箱热图
geom_hex(): 六边形封箱图
geom_density_2d(): 二维等高线密度图
data:image/s3,"s3://crabby-images/80de1/80de1d3558940eb46b1f46fb17dff3213c024154" alt=""
2.1 二维封箱热图
geom_bin2d()将点的数量用矩形封装起来,通过颜色深浅来反映点密度
c+geom_bin2d()
data:image/s3,"s3://crabby-images/39c4c/39c4c8fef2dd47f4693309c396c59de15d2e829b" alt=""
设置bin的数量
c+geom_bin2d(bins=150)
data:image/s3,"s3://crabby-images/e50b0/e50b0ee7291b7c011b5351a6e60a00a444688553" alt=""
2.2 六边形封箱图
geom_hex()依赖于另一个R包hexbin,所以没安装的先安装:
if (!require("hexbin")) install.packages("hexbin")
library(hexbin)
c+geom_hex()
data:image/s3,"s3://crabby-images/eb2e6/eb2e6986a7fdf2080cead951daf89ab614024b77" alt=""
修改bin的数目
c+geom_hex(bins=10)
data:image/s3,"s3://crabby-images/ffa00/ffa0068cb29ef5aed050259158f032b2dfae77f0" alt=""
2.3 二维等高线密度图
sp <- ggplot(faithful, aes(x=eruptions, y=waiting))
sp+geom_point()+ geom_density_2d()
data:image/s3,"s3://crabby-images/47e24/47e244fcf00a14b053c443cc0921c045c6ecbb4a" alt=""
完整代码如下:
library(ggplot2)
#diamonds有54000颗钻石的数据,太大只显示头部的几行记录
output(head(diamonds))
#二维封箱热图
header1("二维封箱热图")
c <- ggplot(data=diamonds, aes(carat, price))
c+geom_bin2d()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#设置bin的数量
c+geom_bin2d(bins=150)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#六边形封箱图
header1("六边形封箱图")
if (!require("hexbin")) install.packages("hexbin")
library(hexbin)
c+geom_hex()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改bin的数目
c+geom_hex(bins=10)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("二维等高线密度图")
sp <- ggplot(faithful, aes(x=eruptions, y=waiting))
sp+geom_point()+ geom_density_2d()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
3、两个变量:连续函数
主要是如何通过线来连接两个变量,使用数据集economics。
head(economics)
data:image/s3,"s3://crabby-images/6ec44/6ec449f42706f496e9e990574b1411e1c0d60a0a" alt=""
先创建一个ggplot图层,后面逐步添加图层
d <- ggplot(data = economics, aes(x=date, y=unemploy))
可添加的图层有:
geom_area():面积图
geom_line():折线图
geom_step(): 阶梯图
3.1 面积图
d+geom_area()
data:image/s3,"s3://crabby-images/63ce6/63ce6cfc93abd5b75737cf30ed91b51143955b01" alt=""
3.2 线图
d+geom_line()
data:image/s3,"s3://crabby-images/a06c0/a06c093e607892cf238595b2ac667800b814a493" alt=""
3.3 阶梯图
set.seed(1111)
ss <- economics[sample(1:nrow(economics), 20),]
ggplot(ss, aes(x=date, y=unemploy))+geom_step()
data:image/s3,"s3://crabby-images/751c9/751c91f80acb0dd9d5c3343223a0edcca9cad2f3" alt=""
完整代码如下:
library(ggplot2)
output(head(economics))
#面积图
header1("面积图")
d <- ggplot(data = economics, aes(x=date, y=unemploy))
d+geom_area()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("线图")
d+geom_line()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("阶梯图")
set.seed(1111)
ss <- economics[sample(1:nrow(economics), 20),]
ggplot(ss, aes(x=date, y=unemploy))+ geom_step()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
4、 两个变量:x离散,y连续
使用数据集ToothGrowth,其中的变量len(Tooth length)是连续变量,dose是离散变量。
ToothGrowth$dose <- as.factor(ToothGrowth$dose)
head(ToothGrowth)
创建图层
e <- ggplot(data = ToothGrowth, aes(x=dose, y=len))
可添加的图层有:
geom_boxplot(): 箱线图
geom_violin():小提琴图
geom_dotplot():点图
geom_jitter(): 带状图
geom_line(): 线图
geom_bar(): 条形图
data:image/s3,"s3://crabby-images/87f7e/87f7ed987997bb44c3d3cba6eccff22eeef80507" alt=""
4.1 箱线图
e+geom_boxplot()
data:image/s3,"s3://crabby-images/eeb58/eeb582e68e6d9fbf54b43f2f16496805df5121e3" alt=""
添加有缺口的箱线图
e+geom_boxplot(notch = TRUE)
data:image/s3,"s3://crabby-images/300dd/300ddf6adeba7d76ecb7e7b72d42b73addf09e6d" alt=""
将dose映射给填充颜色
e+geom_boxplot(aes(fill=dose))
data:image/s3,"s3://crabby-images/cd6d5/cd6d5d22ba0145f719969c5650896e8a7f47b8a9" alt=""
按supp进行分类并映射给填充颜色
ggplot(ToothGrowth, aes(x=dose, y=len))+ geom_boxplot(aes(fill=supp))
data:image/s3,"s3://crabby-images/1aa44/1aa4476bde9f33b8680e58b3a78118bb2f6c63c7" alt=""
4.2 小提琴图
e+geom_violin(trim = FALSE)
data:image/s3,"s3://crabby-images/551f1/551f1e218a789305fc88705c77fcc0a57f489d28" alt=""
添加中值点
e+geom_violin(trim = FALSE)+
stat_summary(fun.data = mean_sdl, fun.args = list(mult=1),
geom="pointrange", color="red")
data:image/s3,"s3://crabby-images/7b481/7b48197d520f070a725e4ead9e2d06bac645abe7" alt=""
与箱线图结合
e+geom_violin(trim = FALSE)+
geom_boxplot(width=0.2)
data:image/s3,"s3://crabby-images/7d2f1/7d2f1514fce52fc28b0eb3bc014f6d2ea9ec7d16" alt=""
将dose映射给颜色进行分组
e+geom_violin(aes(color=dose), trim = FALSE)
data:image/s3,"s3://crabby-images/ffe7f/ffe7fdbbd2316df7d62931780421daf3d34212f1" alt=""
4.3 点图
e+geom_dotplot(binaxis = "y", stackdir = "center")
data:image/s3,"s3://crabby-images/aa77a/aa77a01a061a848eb532dc6a71e9a3a9b8643ba0" alt=""
添加中值点
e + geom_dotplot(binaxis = "y", stackdir = "center") +
stat_summary(fun.data=mean_sdl, color = "red",geom = "pointrange",fun.args=list(mult=1))
data:image/s3,"s3://crabby-images/fdc91/fdc9169d9b73352d57d2b409c97a8f43a43fd363" alt=""
与箱线图结合
e + geom_boxplot() +
geom_dotplot(binaxis = "y", stackdir = "center")
data:image/s3,"s3://crabby-images/6d51c/6d51cb480c95681ece76ab429b1f4c8712130578" alt=""
添加小提琴图
e + geom_violin(trim = FALSE) +
geom_dotplot(binaxis='y', stackdir='center')
data:image/s3,"s3://crabby-images/27a7b/27a7b8a4df5e0719547cb5cdc287d6e277e3a3b1" alt=""
将dose映射给颜色以及填充色
e + geom_dotplot(aes(color = dose, fill = dose),
binaxis = "y", stackdir = "center")
data:image/s3,"s3://crabby-images/592f3/592f3b5c33aaa260e4d43c80423d92ade4ad2209" alt=""
4.5 带状图
带状图是一种一维散点图,当样本量很小时,与箱线图相当
e + geom_jitter(position=position_jitter(0.2))
data:image/s3,"s3://crabby-images/c1e9e/c1e9eb7ee6b902c9a570f9b6417b61e1d6941903" alt=""
添加中值点
e + geom_jitter(position=position_jitter(0.2)) +
stat_summary(fun.data="mean_sdl", fun.args = list(mult=1),
geom="pointrange", color = "red")
data:image/s3,"s3://crabby-images/f86a4/f86a40e8b15e9b8d8794893e3e307428e050b88e" alt=""
与点图结合
e + geom_jitter(position=position_jitter(0.2)) +
geom_dotplot(binaxis = "y", stackdir = "center")
data:image/s3,"s3://crabby-images/bb8cb/bb8cbbef69b27a18e7f61d38553b577033c17f73" alt=""
与小提琴图结合
e + geom_violin(trim = FALSE) +
geom_jitter(position=position_jitter(0.2))
data:image/s3,"s3://crabby-images/e5146/e514682dd25e7574d91b1d625175273a7d096cd4" alt=""
将dose映射给颜色和形状
e + geom_jitter(aes(color = dose, shape = dose),
position=position_jitter(0.2))
data:image/s3,"s3://crabby-images/ac906/ac90643c57791296885ee73e067617f63a6ec548" alt=""
4.6 线图
#构造数据集
df <- data.frame(supp=rep(c("VC", "OJ"), each=3),
dose=rep(c("D0.5", "D1", "D2"),2),
len=c(6.8, 15, 33, 4.2, 10, 29.5))
head(df)
data:image/s3,"s3://crabby-images/2bf6b/2bf6b13e9c77f8ff9f85102a0397c4d35520b57c" alt=""
将supp映射线型
ggplot(df, aes(x=dose, y=len, group=supp)) +
geom_line(aes(linetype=supp))+
geom_point()
data:image/s3,"s3://crabby-images/7b92c/7b92c82051e67bd3394edf7c15012f041825983d" alt=""
修改线型、点的形状以及颜色
ggplot(df, aes(x=dose, y=len, group=supp)) +
geom_line(aes(linetype=supp, color = supp))+
geom_point(aes(shape=supp, color = supp))
data:image/s3,"s3://crabby-images/21608/216087b0762e8f37dddacc40d85d354ed8e7dd37" alt=""
4.7 条形图
#构造数据集
df <- data.frame(dose=c("D0.5", "D1", "D2"),
len=c(4.2, 10, 29.5))
head(df)
## dose len
## 1 D0.5 4.2
## 2 D1 10.0
## 3 D2 29.5
df2 <- data.frame(supp=rep(c("VC", "OJ"), each=3),
dose=rep(c("D0.5", "D1", "D2"),2),
len=c(6.8, 15, 33, 4.2, 10, 29.5))
head(df2)
## supp dose len
## 1 VC D0.5 6.8
## 2 VC D1 15.0
## 3 VC D2 33.0
## 4 OJ D0.5 4.2
## 5 OJ D1 10.0
## 6 OJ D2 29.5
创建图层
f <- ggplot(df, aes(x = dose, y = len))
f + geom_bar(stat = "identity")
data:image/s3,"s3://crabby-images/d0c1b/d0c1bd35794a4189b52652ca48c4b9601dee86f0" alt=""
修改填充色以及添加标签
f + geom_bar(stat="identity", fill="steelblue")+
geom_text(aes(label=len), vjust=-0.3, size=3.5)+
theme_minimal()
data:image/s3,"s3://crabby-images/8a87b/8a87bf071b60236a2de8a59270fd09d04f100afb" alt=""
将dose映射给条形图颜色
f + geom_bar(aes(color = dose),
stat="identity", fill="white")
data:image/s3,"s3://crabby-images/d2071/d20716afbe7c01d5bc55b24dd37b65faacd95832" alt=""
修改填充色
f + geom_bar(aes(fill = dose), stat="identity")
data:image/s3,"s3://crabby-images/4a0de/4a0dee4fda52a96280ef7cc5d4867aec5259950c" alt=""
将变量supp映射给填充色,从而达到分组效果
g <- ggplot(data=df2, aes(x=dose, y=len, fill=supp))
g + geom_bar(stat = "identity")#position默认为stack
data:image/s3,"s3://crabby-images/b0e5f/b0e5f11462ab6ea7470f01f5b5657bd429d44878" alt=""
修改position为dodge
g + geom_bar(stat="identity", position=position_dodge())
data:image/s3,"s3://crabby-images/40f47/40f47aca823506370c0f319e83ea7c76b31a3327" alt=""
完整代码如下:
library(ggplot2)
#output(head(ToothGrowth))
ToothGrowth$dose <- as.factor(ToothGrowth$dose)
output(head(ToothGrowth))
#箱线图
header1("箱线图")
e <- ggplot(data = ToothGrowth, aes(x=dose, y=len))
e+geom_boxplot()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加有缺口的箱线图
e+geom_boxplot(notch = TRUE)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给填充颜色
e+geom_boxplot(aes(fill=dose))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#按supp进行分类并映射给填充颜色
ggplot(ToothGrowth, aes(x=dose, y=len))+ geom_boxplot(aes(fill=supp))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#小提琴图
header1("小提琴图")
e+geom_violin(trim = FALSE)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加中值点
if (!require("Hmisc")) install.packages("Hmisc")
e+geom_violin(trim = FALSE)+
stat_summary(fun.data = mean_sdl, fun.args = list(mult=1),
geom="pointrange", color="red")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#与箱线图结合
e+geom_violin(trim = FALSE)+geom_boxplot(width=0.2)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给颜色进行分组
e+geom_violin(aes(color=dose), trim = FALSE)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#点图
header1("点图")
e+geom_dotplot(binaxis = "y", stackdir = "center")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加中值点
e + geom_dotplot(binaxis = "y", stackdir = "center") +
stat_summary(fun.data=mean_sdl, color = "red",geom = "pointrange",fun.args=list(mult=1))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#与箱线图结合
e + geom_boxplot() +
geom_dotplot(binaxis = "y", stackdir = "center")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加小提琴图
e + geom_violin(trim = FALSE) +
geom_dotplot(binaxis='y', stackdir='center')
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给颜色以及填充色
e + geom_dotplot(aes(color = dose, fill = dose),
binaxis = "y", stackdir = "center")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#带状图
header1("带状图")
e + geom_jitter(position=position_jitter(0.2))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加中值点
e + geom_jitter(position=position_jitter(0.2)) +
stat_summary(fun.data="mean_sdl", fun.args = list(mult=1),
geom="pointrange", color = "red")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#与点图结合
e + geom_jitter(position=position_jitter(0.2)) +
geom_dotplot(binaxis = "y", stackdir = "center")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#与小提琴图结合
e + geom_violin(trim = FALSE) +
geom_jitter(position=position_jitter(0.2))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给颜色和形状
e + geom_jitter(aes(color = dose, shape = dose),
position=position_jitter(0.2))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#线图
header1("线图")
df <- data.frame(supp=rep(c("VC", "OJ"), each=3),
dose=rep(c("D0.5", "D1", "D2"),2),
len=c(6.8, 15, 33, 4.2, 10, 29.5))
output( head(df))
ggplot(df, aes(x=dose, y=len, group=supp)) +
geom_line(aes(linetype=supp))+
geom_point()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改线型、点的形状以及颜色
ggplot(df, aes(x=dose, y=len, group=supp)) +
geom_line(aes(linetype=supp, color = supp))+
geom_point(aes(shape=supp, color = supp))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("条形图")
df <- data.frame(dose=c("D0.5", "D1", "D2"),
len=c(4.2, 10, 29.5))
output(head(df))
df2 <- data.frame(supp=rep(c("VC", "OJ"), each=3),
dose=rep(c("D0.5", "D1", "D2"),2),
len=c(6.8, 15, 33, 4.2, 10, 29.5))
output(head(df2))
f <- ggplot(df, aes(x = dose, y = len))
f + geom_bar(stat = "identity")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改填充色以及添加标签
f + geom_bar(stat="identity", fill="steelblue")+
geom_text(aes(label=len), vjust=-0.3, size=3.5)+
theme_minimal()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给条形图颜色
f + geom_bar(aes(color = dose),
stat="identity", fill="white")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改填充色
f + geom_bar(aes(fill = dose), stat="identity")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将变量supp映射给填充色,从而达到分组效果
g <- ggplot(data=df2, aes(x=dose, y=len, fill=supp))
g + geom_bar(stat = "identity")#position默认为stack
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改position为dodge
g + geom_bar(stat="identity", position=position_dodge())
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
5、 两个变量:x、y皆离散
使用数据集diamonds中的两个离散变量color以及cut
ggplot(diamonds, aes(cut, color)) +
geom_jitter(aes(color = cut), size = 0.5)
data:image/s3,"s3://crabby-images/3635f/3635fe163a9b424d956fbf7464eb6fbb1091a825" alt=""
6、 两个变量:绘制误差图
df <- ToothGrowth
df$dose <- as.factor(df$dose)
head(df)
## len supp dose
## 1 4.2 VC 0.5
## 2 11.5 VC 0.5
## 3 7.3 VC 0.5
## 4 5.8 VC 0.5
## 5 6.4 VC 0.5
## 6 10.0 VC 0.5
绘制误差图需要知道均值以及标准误,下面这个函数用来计算每组的均值以及标准误。
data_summary <- function(data, varname, grps){
require(plyr)
summary_func <- function(x, col){
c(mean = mean(x[[col]], na.rm=TRUE),
sd = sd(x[[col]], na.rm=TRUE))
}
data_sum<-ddply(data, grps, .fun=summary_func, varname)
data_sum <- rename(data_sum, c("mean" = varname))
return(data_sum)
}
计算均值以及标准误
df2 <- data_summary(df, varname="len", grps= "dose")
# Convert dose to a factor variable
df2$dose=as.factor(df2$dose)
head(df2)
## dose len sd
## 1 0.5 10.605 4.499763
## 2 1 19.735 4.415436
## 3 2 26.100 3.774150
创建图层
f <- ggplot(df2, aes(x = dose, y = len,
ymin = len-sd, ymax = len+sd))
可添加的图层有:
geom_crossbar(): 空心柱,上中下三线分别代表ymax、mean、ymin
geom_errorbar(): 误差棒
geom_errorbarh(): 水平误差棒
geom_linerange():竖直误差线
geom_pointrange():中间为一点的误差线
data:image/s3,"s3://crabby-images/02800/02800799c85300d193c9d32acee9f891762b516e" alt=""
6.1 空心柱
geom_crossbar()
f+geom_crossbar()
data:image/s3,"s3://crabby-images/f29ea/f29ea66d218fe59658b86057599aea1b665fc013" alt=""
将dose映射给颜色
f+geom_crossbar(aes(color=dose))
data:image/s3,"s3://crabby-images/fcd61/fcd6154f4d4c3b21bd37b8f2523143baecefd47e" alt=""
自定义颜色
f+geom_crossbar(aes(color=dose))+
scale_color_manual(values = c("#999999", "#E69F00", "#56B4E9"))+theme_classic()
data:image/s3,"s3://crabby-images/64bfc/64bfceeed4146d0d27350dd10d00b7c5196c685c" alt=""
修改填充色
f+geom_crossbar(aes(fill=dose))+
scale_fill_manual(values = c("#999999", "#E69F00", "#56B4E9"))+
theme_classic()
data:image/s3,"s3://crabby-images/0e6cc/0e6cc0fa8096598e5b07a8f8053245616d32beb7" alt=""
通过将supp映射给颜色实现分组,可以利用函数stat_summary()来计算mean和sd
f <- ggplot(df, aes(x=dose, y=len, color=supp))
f+stat_summary(fun.data = mean_sdl, fun.args = list(mult=1), geom="crossbar", width=0.6, position = position_dodge(0.8))
data:image/s3,"s3://crabby-images/01a03/01a0372eb4862bb20df92f96b7820a8ed44c3854" alt=""
6.2 误差棒
f <- ggplot(df2, aes(x=dose, y=len, ymin=len-sd, ymax=len+sd))
将dose映射给颜色
f+geom_errorbar(aes(color=dose), width=0.2)
data:image/s3,"s3://crabby-images/51b0f/51b0f03d1824179d196a7a5e9f00ae8dba50d6de" alt=""
与线图结合
f+geom_line(aes(group=1))+
geom_errorbar(width=0.15)
data:image/s3,"s3://crabby-images/af1cc/af1cc115b2cd6e1d5d7969eec4b6954ff16cbbe2" alt=""
与条形图结合,并将变量dose映射给颜色
f+geom_bar(aes(color=dose), stat = "identity", fill="white")+
geom_errorbar(aes(color=dose), width=0.1)
data:image/s3,"s3://crabby-images/74abf/74abf0cae807084ea117831427178361682e7ecc" alt=""
6.3 水平误差棒
#构造数据集
df2 <- data_summary(ToothGrowth, varname="len", grps = "dose")
df2$dose <- as.factor(df2$dose)
head(df2)
## dose len sd
## 1 0.5 10.605 4.499763
## 2 1 19.735 4.415436
## 3 2 26.100 3.774150
创建图层
f <- ggplot(data = df2, aes(x=len, y=dose,xmin=len-sd, xmax=len+sd))
参数xmin与xmax用来设置水平误差棒
f+geom_errorbarh()
data:image/s3,"s3://crabby-images/d6991/d69912c7d15fcf43d8998fb1ceb8db6514bc8927" alt=""
通过映射实现分组
f+geom_errorbarh(aes(color=dose))
data:image/s3,"s3://crabby-images/62775/62775a2b260f409e1b1eb3bdc0efdb0a8384a163" alt=""
6.4 竖直误差线
geom_linerange()与geom_pointrange()
f <- ggplot(df2, aes(x=dose, y=len, ymin=len-sd, ymax=len+sd))
line range
f+geom_linerange()
data:image/s3,"s3://crabby-images/84c05/84c05edf3924dc7f7c79d746005deaa9e6a038b5" alt=""
6.5 中间为一点的误差线
point range
f+geom_pointrange()
data:image/s3,"s3://crabby-images/5e0c4/5e0c48c841d3c03d16311192d6672de587d9c882" alt=""
6.6 点图+误差棒
g <- ggplot(df, aes(x=dose, y=len))+
geom_dotplot(binaxis = "y", stackdir = "center")
添加geom_crossbar()
g+stat_summary(fun.data = mean_sdl, fun.args = list(mult=1), geom="crossbar", color="red", width=0.1)
data:image/s3,"s3://crabby-images/91c87/91c8710aafeec313b17a2ec70abea8dc86ee2620" alt=""
添加geom_errorbar()
g + stat_summary(fun.data=mean_sdl, fun.args = list(mult=1),
geom="errorbar", color="red", width=0.2) +
stat_summary(fun.y=mean, geom="point", color="red")
data:image/s3,"s3://crabby-images/38399/38399685e57a7a5fdbb7f20cd42eb2a7b348865f" alt=""
添加geom_pointrange()
g + stat_summary(fun.data=mean_sdl, fun.args = list(mult=1),
geom="pointrange", color="red")
data:image/s3,"s3://crabby-images/00f78/00f78e2e29de4069e975ab44b967760683d7ee03" alt=""
完整代码如下:
library(ggplot2)
df <- ToothGrowth
df$dose <- as.factor(df$dose)
head(df)
data_summary <- function(data, varname, grps){
require(plyr)
summary_func <- function(x, col){
c(mean = mean(x[[col]], na.rm=TRUE),
sd = sd(x[[col]], na.rm=TRUE))
}
data_sum<-ddply(data, grps, .fun=summary_func, varname)
data_sum <- rename(data_sum, c("mean" = varname))
return(data_sum)
}
df2 <- data_summary(df, varname="len", grps= "dose")
# Convert dose to a factor variable
df2$dose=as.factor(df2$dose)
head(df2)
f <- ggplot(df2, aes(x = dose, y = len,
ymin = len-sd, ymax = len+sd))
f+geom_crossbar()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#将dose映射给颜色
f+geom_crossbar(aes(color=dose))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#自定义颜色
f+geom_crossbar(aes(color=dose))+
scale_color_manual(values = c("#999999", "#E69F00", "#56B4E9"))+theme_classic()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#修改填充色
f+geom_crossbar(aes(fill=dose))+
scale_fill_manual(values = c("#999999", "#E69F00", "#56B4E9"))+
theme_classic()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
f <- ggplot(df, aes(x=dose, y=len, color=supp))
f+stat_summary(fun.data = mean_sdl, fun.args = list(mult=1), geom="crossbar", width=0.6, position = position_dodge(0.8))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("误差棒")
f <- ggplot(df2, aes(x=dose, y=len, ymin=len-sd, ymax=len+sd))
#将dose映射给颜色
f+geom_errorbar(aes(color=dose), width=0.2)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#与线图结合
f+geom_line(aes(group=1))+
geom_errorbar(width=0.15)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
f+geom_bar(aes(color=dose), stat = "identity", fill="white")+
geom_errorbar(aes(color=dose), width=0.1)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
header1("水平误差棒")
df2 <- data_summary(ToothGrowth, varname="len", grps = "dose")
df2$dose <- as.factor(df2$dose)
output(head(df2))
#创建图层
f <- ggplot(data = df2, aes(x=len, y=dose,xmin=len-sd, xmax=len+sd))
f+geom_errorbarh()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
f+geom_errorbarh(aes(color=dose))
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#line range
f <- ggplot(df2, aes(x=dose, y=len, ymin=len-sd, ymax=len+sd))
f+geom_linerange()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#point range
f+geom_pointrange()
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#点图+误差棒
g <- ggplot(df, aes(x=dose, y=len))+
geom_dotplot(binaxis = "y", stackdir = "center")
#添加geom_crossbar()
g+stat_summary(fun.data = mean_sdl, fun.args = list(mult=1), geom="crossbar", color="red", width=0.1)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加geom_errorbar()
g + stat_summary(fun.data=mean_sdl, fun.args = list(mult=1),
geom="errorbar", color="red", width=0.2) +
stat_summary(fun.y=mean, geom="point", color="red")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
#添加geom_pointrange()
g + stat_summary(fun.data=mean_sdl, fun.args = list(mult=1),
geom="pointrange", color="red")
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
7、 两个变量:地图绘制
ggplot2提供了绘制地图的函数geom_map(),依赖于包maps提供地理信息。
安装map
if (!require("maps")) install.packages("maps")
下面将绘制美国地图,数据集采用USArrests
library(maps)
head(USArrests)
## Murder Assault UrbanPop Rape
## Alabama 13.2 236 58 21.2
## Alaska 10.0 263 48 44.5
## Arizona 8.1 294 80 31.0
## Arkansas 8.8 190 50 19.5
## California 9.0 276 91 40.6
## Colorado 7.9 204 78 38.7
对数据进行整理一下,添加一列state
crimes <- data.frame(state=tolower(rownames(USArrests)), USArrests)
head(crimes)
## Murder Assault UrbanPop Rape
## Alabama 13.2 236 58 21.2
## Alaska 10.0 263 48 44.5
## Arizona 8.1 294 80 31.0
## Arkansas 8.8 190 50 19.5
## California 9.0 276 91 40.6
## Colorado 7.9 204 78 38.7
#数据重铸
library(reshape2)
crimesm <- melt(crimes, id=1)
head(crimesm)
## state variable value
## 1 alabama Murder 13.2
## 2 alaska Murder 10.0
## 3 arizona Murder 8.1
## 4 arkansas Murder 8.8
## 5 california Murder 9.0
## 6 colorado Murder 7.9
map_data <- map_data("state")
#绘制地图,使用Murder进行着色
ggplot(crimes, aes(map_id=state))+
geom_map(aes(fill=Murder), map=map_data)+
expand_limits(x=map_data$long, y=map_data$lat)
data:image/s3,"s3://crabby-images/3f2a4/3f2a40e6aead1b298a2e602147069722ba2c532c" alt=""
完整代码如下:
library(ggplot2)
if (!require("maps")) install.packages("maps")
library(maps)
output(head(USArrests))
crimes <- data.frame(state=tolower(rownames(USArrests)), USArrests)
output(head(crimes))
if (!require("reshape2")) install.packages("reshape2")
library(reshape2)
crimesm <- melt(crimes, id=1)
output(head(crimesm))
map_data <- map_data("state")
ggplot(crimes, aes(map_id=state))+
geom_map(aes(fill=Murder), map=map_data)+
expand_limits(x=map_data$long, y=map_data$lat)
ggsave(gettempfile(), width = 15, height = 10, dpi=300,units = "cm")
网友评论