Mastering the grammar
library(ggplot2)
mpg = na.omit(mpg)
# The fuel economy dataset, mpg, records make, model, class, engine size,
# transmission and fuel economy for a selection of US cars in 1999 and 2008
# A scatterplot of engine displacement in litres (displ) vs. average
# highway miles per gallon (hwy). # Points are coloured according to number
# of cylinders. This plot summarises the most important factor governing
# fuel economy: engine size.
qplot(displ, hwy, data = mpg, colour = factor(cyl))
data:image/s3,"s3://crabby-images/c1f67/c1f6708584c291d4e82b6789947c0bf03e68f13e" alt="plot of chunk ggplot2-part2-1"
# Instead of using points to represent the data, we could use other geoms
# like lines (left) or bars (right). Neither of these geoms makes sense for
# this data, but they are still grammatically valid.
qplot(displ, hwy, data = mpg, colour = factor(cyl), geom = "line") + theme(legend.position = "none")
data:image/s3,"s3://crabby-images/8be88/8be885c3dd11b6321703ee938a90a3e9bbcb97cb" alt="plot of chunk ggplot2-part2-1"
qplot(displ, hwy, data = mpg, colour = factor(cyl), geom = "bar", stat = "identity",
position = "identity") + theme(legend.position = "none")
data:image/s3,"s3://crabby-images/b3d5d/b3d5de748c268322039a5c09093c0334aa734e3a" alt="plot of chunk ggplot2-part2-1"
# More complicated plots don't have their own names. This plot overlays a
# per group regression line on the existing plot. What would you call this
# plot?
qplot(displ, hwy, data = mpg, colour = factor(cyl)) + geom_smooth(data = subset(mpg,
cyl != 5), method = "lm")
data:image/s3,"s3://crabby-images/662b3/662b353c861b0ff580d707f01b670afb3c6f93a3" alt="plot of chunk ggplot2-part2-1"
# A more complex plot with facets and multiple layers.
qplot(displ, hwy, data = mpg, facets = . ~ year) + geom_smooth()
data:image/s3,"s3://crabby-images/711b3/711b3a0cf0d5dcaf5ef5d90eec8f5ce418583e70" alt="plot of chunk ggplot2-part2-1"
# Examples of legends from four different scales. continuous variable
# mapped to size, and to colour, discrete variable mapped to shape, and to
# colour. The ordering of scales seems upside-down, but this matches the
# labelling of the $y$-axis: small values occur at the bottom.
x <- 1:10
y <- factor(letters[1:5])
qplot(x, x, size = x)
data:image/s3,"s3://crabby-images/d1575/d157565ad5793dfad3b8f356e34ae13ba5fa1bd8" alt="plot of chunk ggplot2-part2-1"
qplot(x, x, 1:10, colour = x)
data:image/s3,"s3://crabby-images/8c228/8c2289f1e30156d3cbc99d371fccae0bb00d088e" alt="plot of chunk ggplot2-part2-1"
qplot(y, y, 1:10, shape = y)
data:image/s3,"s3://crabby-images/496ec/496eca65f354169dd288a940ab57b2cadfb91277" alt="plot of chunk ggplot2-part2-1"
qplot(y, y, 1:10, colour = y)
data:image/s3,"s3://crabby-images/5ff69/5ff699f3fcf01d448ac9314839389d486992f649" alt="plot of chunk ggplot2-part2-1"
# Examples of axes and grid lines for three coordinate systems: Cartesian,
# semi-log and polar. The polar coordinate system illustrates the
# difficulties associated with non-Cartesian coordinates: it is hard to draw
# the axes well.
x1 <- c(1, 10)
y1 <- c(1, 5)
p <- qplot(x1, y1, geom = "blank", xlab = NULL, ylab = NULL) + theme_bw()
p
data:image/s3,"s3://crabby-images/5739f/5739fe2a9ae22f0610ddd5d37cbdadb77145e23c" alt="plot of chunk ggplot2-part2-1"
p + coord_trans(y = "log10")
data:image/s3,"s3://crabby-images/d2ed8/d2ed8068c1e1cf222254e1ad20228fc148431224" alt="plot of chunk ggplot2-part2-1"
data:image/s3,"s3://crabby-images/36ef6/36ef60be379459280da6b03a9cade43054870ddc" alt="plot of chunk ggplot2-part2-1"
p <- qplot(displ, hwy, data = mpg, colour = factor(cyl))
summary(p)
data: manufacturer, model, displ, year, cyl, trans, drv, cty, hwy,
fl, class [234x11]
mapping: colour = factor(cyl), x = displ, y = hwy
faceting: facet_null()
-----------------------------------
geom_point:
stat_identity:
position_identity: (width = NULL, height = NULL)
# Save plot object to disk
save(p, file = "plot.rdata")
# Load from disk
load("plot.rdata")
# Save png to disk
ggsave("plot.png", width = 5, height = 5)
Further reading