Plot Snippets - ggvis
Foreword
- Output options: the ‘tango’ syntax and the ‘readable’ theme.
- Snippets and results.
ggvis
generates html outputs. Graphics presented here are images: .png files; .gif files when specified.
Documentation¶
Dataset¶
For most examples, we use the mtcars
, pressure
, faithful
datasets.
The ggvis
Package¶
library(ggvis)
The Grammar of Graphics¶
Start to explore
# change the code below to plot the disp variable of mtcars on the x axis
mtcars %>%
ggvis(~disp, ~mpg) %>%
layer_points()
ggvis
and its capabilities
# Change the code below to make a graph with red points
mtcars %>%
ggvis(~wt, ~mpg, fill := "red") %>%
layer_points()
# Change the code below draw smooths instead of points
mtcars %>%
ggvis(~wt, ~mpg) %>%
layer_smooths()
# Change the code below to make a graph containing both points and a smoothed summary line
mtcars %>%
ggvis(~wt, ~mpg) %>%
layer_points() %>%
layer_smooths()
ggvis
grammar
# Make a scatterplot of the pressure dataset
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_points
# Adapt the code you wrote for the first challenge: show bars instead of points
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_bars
# Adapt the code you wrote for the first challenge: show lines instead of points
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_lines
# Adapt the code you wrote for the first challenge: map the fill property to the temperature variable
pressure %>%
ggvis(~temperature, ~pressure, fill = ~temperature) %>%
layer_points
# Extend the code you wrote for the previous challenge: map the size property to the pressure variable
pressure %>%
ggvis(~temperature, ~pressure, fill = ~temperature, size = ~pressure) %>%
layer_points
4 essential components of a graph
faithful %>%
ggvis(~waiting, ~eruptions, fill := "red") %>%
layer_points() %>%
add_axis("y", title = "Duration of eruption (m)",
values = c(2, 3, 4, 5), subdivide = 9) %>%
add_axis("x", title = "Time since previous eruption (m)")
Lines and Syntax¶
Three operators: %>%
, =
and :=
layer_points(ggvis(faithful, ~waiting, ~eruptions))
# Rewrite the code with the pipe operator
faithful %>%
ggvis(~waiting, ~eruptions) %>%
layer_points()
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_points()
# Modify this graph to map the size property to the pressure variable
pressure %>%
ggvis(~temperature, ~pressure, size = ~pressure) %>%
layer_points()
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_points()
# Modify this graph by setting the size property
pressure %>%
ggvis(~temperature, ~pressure, size := 100) %>%
layer_points()
pressure %>%
ggvis(~temperature, ~pressure, fill = "red") %>%
layer_points()
# Fix this code to set the fill property to red
pressure %>%
ggvis(~temperature, ~pressure, fill := "red") %>%
layer_points()
Referring to different objects
red <- "green"
pressure$red <- pressure$temperature
pressure %>%
ggvis(~temperature, ~pressure, fill := red) %>%
layer_points()
Properties for points
# Change the code to set the fills using pressure$black
pressure %>%
ggvis(~temperature, ~pressure, fill := ~'black') %>%
layer_points()
# Plot the faithful data as described in the second instruction
faithful %>%
ggvis(~waiting, ~eruptions, size = ~eruptions, opacity := 0.5, fill := "blue", stroke := "black") %>%
layer_points()
# Plot the faithful data as described in the third instruction
faithful %>%
ggvis(~waiting, ~eruptions, size := 100, fill := "red", fillOpacity = ~eruptions, stroke := "red", shape := "cross") %>%
layer_points()
Properties for lines
# Change the code below to use the lines mark
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_lines()
# Set the properties described in the second instruction in the graph below
pressure %>%
ggvis(~temperature, ~pressure, stroke := "red", strokeWidth := 2, strokeDash := 6) %>%
layer_lines()
Display model fits
layer_lines()
will always connect the points in your plot from the leftmost point to the rightmost point. This can be undesirable if you are trying to plot a specific shape.
layer_paths()
: this mark connects the points in the order that they appear in the data set. So the paths mark will connect the point that corresponds to the first row of the data to the point that corresponds to the second row of data, and so on - no matter where those points appear in the graph.
# change the third line of code to plot a map of Texas
library(maps)
library(ggplot2)
texas <- ggplot2::map_data("state", region = "texas")
texas %>%
ggvis(~long, ~lat) %>%
layer_paths()
# Same plot, but set the fill property of the texas map to dark orange
texas %>%
ggvis(~long, ~lat, fill := "darkorange") %>%
layer_paths()
compute_smooth()
to simplify model fits
compute_model_prediction()
is a useful function to use with line graphs. It takes a data frame as input and returns a new data frame as output. The new data frame will contain the x and y values of a line fitted to the data in the original data frame.
Generate the x and y coordinates for a LOESS smooth line.
faithful %>%
compute_model_prediction(eruptions ~ waiting, model = "lm") %>%
head(10)
1 2 3 4 5 6 7 8 9 10 11 |
|
# Compute the x and y coordinates for a loess smooth line that predicts mpg with the wt
mtcars %>%
compute_smooth(mpg ~ wt) %>%
head(10)
1 2 3 4 5 6 7 8 9 10 11 |
|
#model = "loess" is set by default
Transformations¶
Histograms (1)
# Build a histogram of the waiting variable of the faithful data set.
faithful %>%
ggvis(~waiting) %>%
layer_histograms()
# Build the same histogram, but with a binwidth (width argument) of 5 units
faithful %>%
ggvis(~waiting) %>%
layer_histograms(width = 5)
Histograms (2)
faithful %>%
ggvis(~waiting) %>%
layer_histograms(width = 5)
# Transform the code: just compute the bins instead of plotting a histogram
faithful %>%
compute_bin(~waiting, width = 5)
1 2 3 4 5 6 7 8 9 10 11 12 |
|
# Combine the solution to the first challenge with layer_rects() to build a histogram
faithful %>%
compute_bin(~waiting, width = 5) %>%
ggvis(x = ~xmin_, x2 = ~xmax_, y = 0, y2 = ~count_) %>%
layer_rects()
Density plots
# Combine compute_density() with layer_lines() to make a density plot of the waiting variable.
faithful %>%
compute_density(~waiting) %>%
ggvis(~pred_,~resp_) %>%
layer_lines()
# Build a density plot directly using layer_densities. Use the correct variables and properties.
faithful %>%
ggvis(~waiting) %>%
layer_densities(fill := "green")
Shortcuts
# Complete the code to plot a bar graph of the cyl factor.
mtcars %>%
ggvis(~factor(cyl)) %>%
layer_bars()
# Adapt the solution to the first challenge to just calculate the count values. No plotting!
mtcars %>%
compute_count(~factor(cyl))
1 2 3 4 |
|
ggvis
and group_by
mtcars %>%
group_by(am) %>%
ggvis(~mpg, ~wt, stroke = ~factor(am)) %>%
layer_smooths()
# Change the code to plot a unique smooth line for each value of the cyl variable.
mtcars %>%
group_by(cyl) %>%
ggvis(~mpg, ~wt, stroke = ~factor(cyl)) %>%
layer_smooths()
# Adapt the graph to contain a separate density for each value of cyl.
mtcars %>%
group_by(cyl) %>%
ggvis(~mpg) %>%
layer_densities()
# Copy and alter the solution to the second challenge to map the fill property to a categorical version of cyl.
mtcars %>%
group_by(cyl) %>%
ggvis(~mpg) %>%
layer_densities(fill = ~factor(cyl))
group_by()
versus interaction()
mtcars %>%
group_by(cyl) %>%
ggvis(~mpg) %>%
layer_densities(fill = ~factor(cyl))
# Alter the graph: separate density for each unique combination of 'cyl' and 'am'.
mtcars %>%
group_by(cyl,am) %>%
ggvis(~mpg, fill = ~factor(cyl)) %>%
layer_densities()
#factor(cyl),factor(am)
mtcars %>%
group_by(cyl, am) %>%
ggvis(~mpg, fill = ~factor(cyl)) %>%
layer_densities()
# Update the graph to map `fill` to the unique combinations of the grouping variables.
mtcars %>%
group_by(cyl, am) %>%
ggvis(~mpg, fill = ~interaction(cyl,am)) %>%
layer_densities()
Chaining is a virtue
mtcars %>%
group_by(cyl, am) %>%
ggvis(~mpg, fill = ~interaction(cyl, am)) %>%
layer_densities()
This call is exactly equivalent to the following piece of code that is very hard to read:
layer_densities(ggvis(group_by(mtcars, cyl, am), ~mpg, fill = ~interaction(cyl, am)))
Interactivity and Layers¶
The basics of interactive plots
# Run this code and inspect the output. Follow the link in the instructions for the interactive version
faithful %>%
ggvis(~waiting, ~eruptions, fillOpacity := 0.5,
shape := input_select(label = "Choose shape:", choices = c("circle", "square", "cross", "diamond", "triangle-up", "triangle-down"))) %>%
layer_points()
.gif file:
# Copy the first code chunk and alter the code to make the fill property interactive using a select box
faithful %>%
ggvis(~waiting, ~eruptions, fillOpacity := 0.5, shape := input_select(label = "Choose shape:", choices = c("circle", "square", "cross", "diamond", "triangle-up", "triangle-down")), fill := input_select(label = "Choose color:", choices = c("black","red","blue","green"))) %>%
layer_points()
.gif file:
# Add radio buttons to control the fill of the plot
mtcars %>%
ggvis(~mpg, ~wt, fill := input_radiobuttons(label = "Choose color:", choices = c("black","red","blue","green"))) %>%
layer_points()
.gif file:
Input widgets in more detail
mtcars %>%
ggvis(~mpg, ~wt, fill := input_radiobuttons(label = "Choose color:", choices = c("black", "red", "blue", "green"))) %>%
layer_points()
.gif file:
# Change the radiobuttons widget to a text widget
mtcars %>%
ggvis(~mpg, ~wt, fill := input_text(label = "Choose color:", value = c("black"))) %>%
layer_points()
.gif file:
mtcars %>%
ggvis(~mpg, ~wt) %>%
layer_points()
# Map the fill property to a select box that returns variable names
mtcars %>%
ggvis(~mpg, ~wt, fill = input_select(label = "Choose fill variable:", choices = names(mtcars), map = as.name)) %>%
layer_points()
.gif file:
Input widgets in more detail (2)
# Map the fill property to a select box that returns variable names
mtcars %>%
ggvis(~mpg, ~wt, fill = input_select(label = "Choose fill variable:", choices = names(mtcars), map = as.name)) %>%
layer_points()
.gif file:
Control parameters and values
# Map the bindwidth to a numeric field ("Choose a binwidth:")
mtcars %>%
ggvis(~mpg) %>%
layer_histograms(width = input_numeric(value = 1, label = "Choose a binwidth:"))
.gif file:
# Map the binwidth to a slider bar ("Choose a binwidth:") with the correct specifications
mtcars %>%
ggvis(~mpg) %>%
layer_histograms(width = input_slider(min = 1, max = 20, label = "Choose a binwidth:"))
.gif file:
Multi-layered plots and their properties
# Add a layer of points to the graph below.
pressure %>%
ggvis(~temperature, ~pressure, stroke := "skyblue") %>% layer_lines() %>%
layer_points()
# Copy and adapt the solution to the first instruction below so that only the lines layer uses a skyblue stroke.
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_lines(stroke := "skyblue") %>%
layer_points()
# Rewrite the code below so that only the points layer uses the shape property.
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_lines(stroke := "skyblue") %>%
layer_points(shape := "triangle-up")
# Refactor the code for the graph below to make it as concise as possible
pressure %>%
ggvis(~temperature, ~pressure, stroke := "skyblue", strokeOpacity := 0.5, strokeWidth := 5) %>%
layer_lines() %>%
layer_points(fill = ~temperature, shape := "triangle-up", size := 300)
Multi-layered plots and their properties (2)
# Rewrite the code below so that only the points layer uses the shape property.
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_lines(stroke := "skyblue") %>%
layer_points(shape := "triangle-up")
# Refactor the code for the graph below to make it as concise as possible
pressure %>%
ggvis(~temperature, ~pressure, stroke := "skyblue",
strokeOpacity := 0.5, strokeWidth := 5) %>%
layer_lines() %>%
layer_points(fill = ~temperature, shape := "triangle-up", size := 300)
There is no limit on the number of layers!
# Create a graph containing a scatterplot, a linear model and a smooth line.
pressure %>%
ggvis(~temperature, ~pressure) %>%
layer_points() %>%
layer_lines(stroke := "black", opacity := 0.5) %>%
layer_model_predictions(model = "lm", stroke := "navy") %>%
layer_smooths(stroke := "skyblue")
Taking local and global to the next level
pressure %>%
ggvis(~temperature, ~pressure, stroke := "darkred") %>%
layer_lines(stroke := "orange", strokeDash := 5, strokeWidth := 5) %>%
layer_points(shape := "circle", size := 100, fill := "lightgreen") %>%
layer_smooths()
Customizing Axes, Legends, and Scales¶
Axes
# add the title of the x axis: "Time since previous eruption (m)"
faithful %>%
ggvis(~waiting, ~eruptions) %>%
layer_points() %>%
add_axis("y", title = "Duration of eruption (m)") %>%
add_axis("x", title = "Time since previous eruption (m)")
# Add to the code to place a labelled tick mark at 50, 60, 70, 80, 90 on the x axis.
faithful %>%
ggvis(~waiting, ~eruptions) %>%
layer_points() %>%
add_axis("y", title = "Duration of eruption (m)", values = c(2, 3, 4, 5), subdivide = 9) %>%
add_axis("x", title = "Time since previous eruption (m)", values = c(50, 60, 70, 80, 90), subdivide = 9)
# Add to the code below to change the location of the y axis
faithful %>%
ggvis(~waiting, ~eruptions) %>%
layer_points() %>%
add_axis("x", orient = "top") %>% add_axis("y", orient = "right")
Legends
# Add a legend to the plot below: use the correct title and orientation
faithful %>%
ggvis(~waiting, ~eruptions, opacity := 0.6, fill = ~factor(round(eruptions))) %>%
layer_points() %>%
add_legend("fill", title = "~ duration (m)", orient = "left")
#add_legend(vis, scales = NULL, orient = "right", title = NULL, format = NULL, values = NULL, properties = NULL)
# Use add_legend() to combine the legends in the plot below. Adjust its properties as instructed.
faithful %>%
ggvis(~waiting, ~eruptions, opacity := 0.6, fill = ~factor(round(eruptions)), shape = ~factor(round(eruptions)),
size = ~round(eruptions)) %>%
layer_points() %>%
add_legend(c("fill", "shape", "size"), title = "~ duration (m)", values = c(2,3,4,5))
Legends (2)
# Fix the legend
faithful %>%
ggvis(~waiting, ~eruptions, opacity := 0.6, fill = ~factor(round(eruptions)), shape = ~factor(round(eruptions)),
size = ~round(eruptions)) %>%
layer_points() %>%
add_legend(c("fill", "shape", "size"), title = "~ duration (m)")
Scale types
# Add to the code below to make the stroke color range from "darkred" to "orange".
mtcars %>%
ggvis(~wt, ~mpg, fill = ~disp, stroke = ~disp, strokeWidth := 2) %>%
layer_points() %>%
scale_numeric("fill", range = c("red", "yellow")) %>% scale_numeric("stroke", range = c("darkred", "orange"))
# Change the graph below to make the fill colors range from green to beige.
mtcars %>% ggvis(~wt, ~mpg, fill = ~hp) %>%
layer_points() %>% scale_numeric("fill", range = c("green", "beige"))
# Create a scale that will map `factor(cyl)` to a new range of colors: purple, blue, and green.
mtcars %>% ggvis(~wt, ~mpg, fill = ~factor(cyl)) %>%
layer_points() %>% scale_nominal("fill", range = c("purple", "blue", "green"))
Adjust any visual property
# Add a scale that limits the range of opacity from 0.2 to 1.
mtcars %>%
ggvis(x = ~wt, y = ~mpg, fill = ~factor(cyl), opacity = ~hp) %>%
layer_points() %>%
scale_numeric("opacity", range = c(0.2,1))
# Add a second scale that will expand the x axis to cover data values from 0 to 6.
mtcars %>%
ggvis(~wt, ~mpg, fill = ~disp) %>%
layer_points() %>%
scale_numeric("y", domain = c(0, NA)) %>%
scale_numeric("x", domain = c(0, 6))
Adjust any visual property (2)
# Add a second scale to set domain for x
mtcars %>%
ggvis(~wt, ~mpg, fill = ~disp) %>%
layer_points() %>%
scale_numeric("y", domain = c(0, NA)) %>%
scale_numeric("x", domain = c(0, 6))
“=
” versus “:=
“
# Set the fill value to the color variable instead of mapping it, and see what happens
mtcars$color <- c("red", "teal", "#cccccc", "tan")
mtcars %>%
ggvis(x = ~wt, y = ~mpg, fill = ~color) %>%
layer_points()
mtcars %>%
ggvis(x = ~wt, y = ~mpg, fill := ~color) %>%
layer_points()