问题
I've made a collection of histograms in ggplot2 and used ImageMagick to animate them into a gif. The idea is that the x-axis scale is supposed to be the same in all the graphs but this isn't quite true because the y-axis wiggles around due to the varying widths of the labels. How can I anchor the graph so that all the graphs have exactly the same axis positions?
Here's my ggplot code if it helps:
hist.fn<-function(tier,ddf){
df<-ddf[ddf$tier==tier,]
l<-match(tier,levels(df$tier))
hist.png<-ggplot(df,aes(df$"Premium Adult Individual Age 40" ))+
geom_histogram()+
labs(title=paste0(tier," premiums in federal exchanges"),
x ="Premium", y = "Frequency")+
coord_cartesian(xlim=c(0, 1500))+
theme_bw()+
theme(text = element_text(size=14), plot.title = element_text(face="bold"),axis.title.x =element_text(face="bold"),axis.title.y =element_text(face="bold"))
file=paste0(l,"hist.jpg")
ggsave(filename=file, plot=hist.png, width=13, height=8, dpi=50)
return(hist.png)
}
data.df$tier%>% levels %>% lapply(FUN=hist.fn,ddf=data.df) ->histograms.of.tiers
system("magick -delay 75 *hist.jpg hist.gif")
回答1:
First and foremost, I would like to point out that the plot might be misleading, due to the different y-axis values. The viewers' attention will go mostly to histogram and not the values. Therefore, I would highly recommend to fix the y-axis across the all of the plots.
library(ggplot2)
library(gridExtra)
library(stringr)
# Generate plots
# For each Species in iris dataset - generate a histogram of the Petal's length
plots = lapply(levels(iris$Species),
function(spec){
ggplot(iris[iris$Species == spec, ], aes(Petal.Length)) +
geom_histogram() +
ggtitle(spec)
})
# Show plots side by side
grid.arrange(grobs = plots, nrow = 1, ncol = 3, top = "Base\n\n")
.
.
# Solution 1 (recommended) - Set the same y-axis range for all the plots
alignLimits = function(plotsList){
# Extract limits of y-axis for each plot
y.limits = sapply(plotsList, function(.){layer_scales(.)$y$range$range})
y.min = min(y.limits[1,]) # Minimum of all the ranges
y.max = max(y.limits[2,]) # Maximum of all the ranges
# Apply new limits for each plot
return(lapply(plotsList,
function(.){. + coord_cartesian(ylim=c(y.min, y.max))}))
}
# Align limits of original plots and display
plots.limits = alignLimits(plots)
grid.arrange(grobs = plots.limits, nrow = 1, ncol = 3, top = "Aligned limits\n\n")
.
However, if you choose otherwise, I would go for padding the axis-labels with white spaces:
# Use whitespaces to pad
alignLables = function(plotsList){
# Extract labels of y-axis
# Note: Don't use the as.character on the maximum limit,
# as decimal places in labels may increase the character count
y.labels = lapply(plotsList, function(.){ggplot_build(.)$layout$panel_ranges[[1]]$y.labels})
# Calculate the maximum number of characters for each plot's labels
maxChars = sapply(y.labels, function(.){max(nchar(.))})
# Define a function that would space-pad the labels and apply
format.labels = function(label){str_pad(label, max(maxChars), pad = " ")}
return(lapply(plotsList, function(.){return(. + scale_y_continuous(labels = format.labels))}))
}
# Align labels of original plots and display
plots.labels = alignLables(plots)
grid.arrange(grobs = plots.labels, nrow = 1, ncol = 3, top = "Aligned labels\n\n")
Feel free to ask if there is anything which is not clear.
回答2:
By converting the plot to a gtable it's easy to set a fixed width, beware that this is not a stable interface and therefore may stop working in the future.
library(ggplot2)
library(grid)
library(gridExtra)
plot_random <- function(){
ggplot() +
labs(y=paste(letters[sample(1:24, sample(1:3))], collapse = "\n"))
}
pl <- replicate(3, plot_random(), simplify = FALSE)
gl <- lapply(pl, ggplotGrob)
wl <- lapply(gl, function(g) g$widths[4])
wmax <- do.call(unit.pmax, wl)
gl <- lapply(gl, function(g) {g$widths[4] <- wmax; g})
grid.arrange(arrangeGrob(grobs = pl, top = "Normal case"),
arrangeGrob(grobs = gl, top = "Standardised left"))
来源:https://stackoverflow.com/questions/48121528/how-do-i-set-width-of-y-axis-labels-in-ggplot2