25 Drawing Five Common Plots by ggplot2
Xirui Guo
library(ggplot2)
library(tidyverse)
library(ggpubr)
library(gridExtra)
library(reshape2)
library(Lock5withR)
library(fivethirtyeight)
library(RColorBrewer)
library(plotly)
25.1 Motivation
The ggplot2 is a powerful and effective package for drawing plots. It has a lot of syntaxes to support people get the graphs they want. A good plot needs to clearly represent the information. Scatter plots, line plots, histograms, boxplots, and heatmaps are frequently used in daily life. This Markdown hopes to be a guide about how to quickly and suitably draw the above five plots by ggplot2.
25.2 Graph1 scatter plot: geom_point
Using data mtcars
The main code for drawing scatter plot is geom_point; however, we usually don’t use it single because we need the plot shows more information and here are some syntaxes people use together with geom_point
:aes(size , color)
: sometimes it is effective, but people need to avoid showing too much information and making the graph hard to read..alpha
: change the transparency of point.geom_text
: add labels of each point.geom_smooth
: show the regression line and correspond standard error boundary.
mtcars$vs <- as.factor(mtcars$vs)
ggplot(mtcars, aes(x=wt, y=mpg, size=cyl, color=vs)) +
geom_point(alpha = .4) +
geom_text(label=rownames(mtcars),
nudge_x = 0.25, nudge_y = 0.25,
check_overlap = T)+
geom_smooth(method=lm , color="red", fill="lightblue", se=TRUE)
data:image/s3,"s3://crabby-images/9b7c6/9b7c68708caf20233f89bd5ddc5c38447b3180b4" alt=""
25.3 Graph2 line chart: geom_line
People need to clarify the x-axis and y-axis and can use group
to draw the line with different colors.
# library(reshape2)
x <- -10:10
var1 <- dnorm(x,-2,1)
var2 <- dnorm(x,2,1)
var3 <- dt(x,2,2)
data <- data.frame(x,var1,var2,var3)
data_n <- melt(data, id="x")
ggplot(data_n,aes(x=x, y=value, group=variable, color=variable))+
geom_line()
data:image/s3,"s3://crabby-images/f791e/f791e512cf50cf14df40d8ce06303b621629f3e7" alt=""
Using geom_line twice: a way for representing line from different groups without legend.
data_n <- data_n %>%
mutate(variable2=variable)
ggplot(data_n, aes(x=x, y=value))+
geom_line(data=data_n %>% select(-variable), aes(group=variable2), color="grey", size=0.5, alpha=0.8) +
geom_line(aes(color=variable), color="blue", size=1)+
facet_wrap(~variable)
data:image/s3,"s3://crabby-images/7b57c/7b57cb48e7c38308ccf6e1249f689e402d0b2865" alt=""
25.4 Graph3 box plot: geom_boxplot
Using the Data: StudentSurvey in Lock5withR package(PSet1). Drawing a “simple” box-plot first:labs()
: simultaneously add the main title and axis labels
# library(Lock5withR)
p3<-ggplot(StudentSurvey, aes(x = SAT, y = Year)) +
geom_boxplot()+
labs(title="Plot of SAT score and Year", x="SAT score", y="Year")
p3
data:image/s3,"s3://crabby-images/2a654/2a654db8eb6ee90aa8425efbaec8442e1a97f65c" alt=""
How to make boxplot shows more information:
1. Using theme()
+ element_text()
to modify the color, font, size of text.
p3+theme(
plot.title = element_text(color = "red", size = 14, face = "bold.italic"),
axis.title.x = element_text(color="blue", size = 14, face = "bold"),
axis.title.y = element_text(color="green", size = 14, face = "bold")
)
data:image/s3,"s3://crabby-images/09ef2/09ef20e38bb592712a210408b0e072112b746521" alt=""
- Adding legend and modifying the legend tittle
p3<-ggplot(StudentSurvey, aes(x = SAT, y = Year, fill=Year)) +
geom_boxplot()+
labs(fill="School Year")
p3
data:image/s3,"s3://crabby-images/dcc97/dcc97ffa59f9dcab4400c62d90516eea250f63cd" alt=""
3.Changing the position of legend: five choices “left”,“top”, “right”, “bottom”, “none”
p3<- p3+
theme(legend.position = "top")
p3
data:image/s3,"s3://crabby-images/2bb00/2bb00f191f0c0e7d1be7a406a25dc78fe8e802e2" alt=""
- Modifying the title, label and background of legend
p3+
theme(
legend.title = element_text(color="blue"),
legend.text = element_text(color="red"),
legend.background = element_rect(fill="lightblue")
)
data:image/s3,"s3://crabby-images/0aa1d/0aa1d7a2c773fe6581025a68d4ba918e5c29a466" alt=""
- Changing the name and order of factor’s level
Y <- fct_recode(StudentSurvey$Year, "NA" = "", "1st" = "FirstYear",
"2nd" = "Sophomore", "3rd" = "Junior", "4th" = "Senior")
Y <- fct_relevel(Y,"1st","2nd","3rd","4th")
p3<-ggplot(StudentSurvey, aes(x = SAT, y = Y, fill=Y)) +
geom_boxplot()+
labs(fill="School Year")
p3
data:image/s3,"s3://crabby-images/d3c54/d3c541bb208a186afdd169de9cd53de72368a61c" alt=""
- 6 ways to change the background of whole plots
p3_1<-p3+theme_gray()
p3_2<-p3+theme_bw()
p3_3<-p3+theme_linedraw()
p3_4<-p3+theme_light()
p3_5<-p3+theme_minimal()
p3_6<-p3+theme_classic()
ggarrange(p3_1,p3_2,p3_3,p3_4,p3_5,p3_6,nrow=3,ncol=2)
data:image/s3,"s3://crabby-images/c1695/c1695c7b93d3b4b527bf1765958550b2914d7e50" alt=""
25.5 Graph4 histogram: geom_histogram
Using Data: bad_drivers in fivethirtyeight package. Common syntaxes with geom_histogram:binwidth
: control the width of each bin.fill
: the color of bin.color
: the frame color of bin.alpha
: control the transparency of the bin color.
# library(fivethirtyeight)
p4 <- ggplot(bad_drivers,aes(x=perc_alcohol,y=..count..)) +
geom_histogram(binwidth=3, fill="lightblue", color="black", alpha=0.7)
p4
data:image/s3,"s3://crabby-images/66c16/66c16155eef19a42003e152923a3adbeedec5dd5" alt=""
coord_flip()
:make the histogram bar become horizontal
p4<- p4 +
coord_flip()
p4
data:image/s3,"s3://crabby-images/f0da1/f0da1081b22e3fe130ab8f8a3abc27d82b43853d" alt=""
scale_x_reverse()
and scale_y_reverse()
:reverse the x-axis and y-axis
p4+
scale_y_reverse()
data:image/s3,"s3://crabby-images/50dce/50dce5c55de6f8943ffcc555b1c9f9d03cfeb97e" alt=""
25.6 Graph5 heatmap: geom_tile
The data is from the class notes
grade <- rep(c("first", "second", "third", "fourth"), 3)
subject <- rep(c("math", "reading", "gym"), each = 4)
statescore <- sample(50, 12) + 50
df <- data.frame(grade, subject, statescore)
p5 <- ggplot(df, aes(grade, subject, fill = statescore)) +
geom_tile()
p5
data:image/s3,"s3://crabby-images/712ac/712ac0c25b0a45f6dd4f9eb192168f8f9672c753" alt=""
- Changing the color
scale_fill_gradient()
,scale_fill_distiller()
andscale_fill_viridis()
scale_fill_gradient()
can customize the colorscale_fill_distiller()
usually need palette = RColorBrewerscale_fill_viridis()
need to let discrete=False when the variable is continuous
# library(RColorBrewer)
display.brewer.all()
data:image/s3,"s3://crabby-images/f487e/f487e4a458179678157ae8d17425d0d911dc760f" alt=""
p5_1<-p5 + scale_fill_gradient(low="white", high="purple") + theme(legend.position="top")
p5_2<-p5 + scale_fill_distiller(palette = "RdBu")+ theme(legend.position="top")
p5_3<-p5 + scale_fill_viridis_c()+ theme(legend.position="top")
ggarrange(p5_1,p5_2,p5_3,nrow=1,ncol=3)
data:image/s3,"s3://crabby-images/1197b/1197b3d027a52081805f3af79bedec8ed94caf24" alt=""
- adding text in each square and interact
25.7 Effective ways for showing more information
25.7.1 Way1: Faceting
- faceting by single discrete variable:
# vertical faceting
p3 +
facet_grid(Award~.)
data:image/s3,"s3://crabby-images/fdff7/fdff7f226a0a0766e9678e03cc5dee00bacf2f1a" alt=""
# horizontal faceting
p3 +
facet_grid(.~Award)
data:image/s3,"s3://crabby-images/4d401/4d401e4fd977eb375df0c71512a8e2495b88f6dc" alt=""
- faceting by two discrete variables:
# column facet by Year and row facet by Award
p3+
facet_grid(Year~Award, scales='free')
data:image/s3,"s3://crabby-images/08174/081744e59f2cea70bb3919bc056690dbbcc56fc4" alt=""
25.7.2 Way2: Representing multiple charts on a single page
Using Data: bad_drivers with syntaxes grid.arrange()
# Make 3 simple graphics:
g6_1 <- ggplot(mtcars, aes(x=qsec)) +
geom_density(fill="slateblue")
g6_2 <- ggplot(mtcars, aes(x=drat, y=qsec, color=cyl)) +
geom_point(size=5) + theme(legend.position="none")
g6_3 <- ggplot(mtcars, aes(x=factor(cyl), y=qsec, fill=cyl)) +
geom_boxplot() +
theme(legend.position="none")
# Plots
grid.arrange(g6_1, arrangeGrob(g6_2, g6_3, ncol=2), nrow = 2)
data:image/s3,"s3://crabby-images/40470/404709e814bfad0a0a5da38c9e5b32f653b2d4e8" alt=""
grid.arrange(g6_1, g6_2, g6_3, nrow = 3)
data:image/s3,"s3://crabby-images/b3acc/b3accc9af40d1ccabfc1feab5546d06e79f7179d" alt=""