Order Bubble Chart bubbles along y-axis using ggplot2 in r

713 Views Asked by At

I want to make a bubble chart using the following data:

> head(data1)
# A tibble: 6 x 4
  Group                        Group_Strength Group_N Group_Quality
  <chr>                                 <dbl>   <dbl>         <dbl>
1 Young Controls                         1          1          18.5
2 Healthy Age-Matched Controls          59         59          20  
3 Neurodegenerative Disease             36        178          19.1
4 Right Hemisphere Stroke                7.86     159          20.1
5 Left Hemisphere Stroke               -19         19          15  
6 Bilateral Stroke                      26         26          17  

I would like the size of each bubble to indicate the Group_N column, the color of each bubble to indicate the Group_Strength column, and the y-axis to indicate the Group_Quality column.

SO far I have been able to represent the Group_N column (bubble size) and the Group_strength column (color) using the following code. But I cannot figure out how to change the order of the bubbles along the y-axis to indicate Group_Quality:

library(packcircles)
library(ggplot2)
library(tidyverse)

data1$Group_N <- as.numeric(data1$Group_N)

# Generate the layout. sizetype can be area or radius, following your preference on what to be proportional to value.
packing1 <- circleProgressiveLayout(data1$Group_N, sizetype='area')
data1 <- cbind(data1, packing1)
dat.gg1 <- circleLayoutVertices(packing1, npoints=50)


dat.gg1$Group_Strength <- rep(data1$Group_Strength, each=51)
# Plot
ggplot() + 
  
  # bubbles
  geom_polygon(data = dat.gg1, aes(x, y, group = id, fill=Group_Strength), colour = "black", alpha = 0.6) +
  scale_fill_distiller(palette = "BuPu", direction = 1 ) +
  
  # text for each bubble
  geom_text(data = data1, aes(x, y, size=Group_N, label = Group)) +
  scale_size_continuous(range = c(1,4)) +
  
  # Theme:
  theme_void()  + 
  theme(legend.position="none") + 
  coord_equal()

Giving me the following figure:

BubblePlot

Can anyone suggest a way to represent Group_Quality along the y-axis, or in some other way? I am at a loss.


Data

data1 <- structure(list(Group = c("Young Controls", 
"Healthy Age-Matched Controls", 
"Neurodegenerative Disease", "Right Hemisphere Stroke", "Left Hemisphere Stroke", 
"Bilateral Stroke"), Group_Strength = c(1, 59, 36, 7.86, -19, 
26), Group_N = c(1L, 59L, 178L, 159L, 19L, 26L), Group_Quality = c(18.5, 
20, 19.1, 20.1, 15, 17)), class = "data.frame", row.names = c(NA, 
-6L))
1

There are 1 best solutions below

2
On

Here is one possible way using ggplot. adding the y-axis kind of destroyes the bubble-plot ides though.

The nicest way is probably to add the Groups as x as well:

library(tidyverse)

data1 <- structure(
  list(
    Group = c(
      "Young Controls",
      "Healthy Age-Matched Controls",
      "Neurodegenerative Disease",
      "Right Hemisphere Stroke",
      "Left Hemisphere Stroke",
      "Bilateral Stroke"
    ),
    Group_Strength = c(1, 59, 36, 7.86,-19,
                       26),
    Group_N = c(1L, 59L, 178L, 159L, 19L, 26L),
    Group_Quality = c(18.5,
                      20, 19.1, 20.1, 15, 17)
  ),
  class = "data.frame",
  row.names = c(NA,-6L)
)

data1 %>%
  ggplot(aes(x = Group, 
             y = Group_Quality
             )) +
  geom_point(aes(
    size = Group_N,
    color = Group_Strength)) +
  theme_minimal() +
  scale_size_area(max_size = 20) +
  geom_label(aes(label = Group),
             nudge_y = - .25 * IQR(data1$Group_Quality)) +
  ylim(min(data1$Group_Quality) * .9,
       max(data1$Group_Quality) * 1.05)

Or you could just set them as a constant:

library(tidyverse)

data1 <- structure(
  list(
    Group = c(
      "Young Controls",
      "Healthy Age-Matched Controls",
      "Neurodegenerative Disease",
      "Right Hemisphere Stroke",
      "Left Hemisphere Stroke",
      "Bilateral Stroke"
    ),
    Group_Strength = c(1, 59, 36, 7.86,-19,
                       26),
    Group_N = c(1L, 59L, 178L, 159L, 19L, 26L),
    Group_Quality = c(18.5,
                      20, 19.1, 20.1, 15, 17)
  ),
  class = "data.frame",
  row.names = c(NA,-6L)
)

data1 %>%
  ggplot(aes(x = 1, 
             y = Group_Quality
             )) +
  geom_point(aes(
    size = Group_N,
    color = Group_Strength)) +
  theme_minimal() +
  scale_size_area(max_size = 20) +
  geom_label(aes(label = Group),
             nudge_y = - .25 * IQR(data1$Group_Quality)) +
  ylim(min(data1$Group_Quality) * .9,
       max(data1$Group_Quality) * 1.05) +
  scale_x_continuous(breaks = NULL,name = '')

Created on 2020-12-17 by the reprex package (v0.3.0)


EDIT

Here's an added linebreak in the labels:

library(tidyverse)

data1 <- structure(
  list(
    Group = c(
      "Young Controls",
      "Healthy Age-Matched Controls",
      "Neurodegenerative Disease",
      "Right Hemisphere Stroke",
      "Left Hemisphere Stroke",
      "Bilateral Stroke"
    ),
    Group_Strength = c(1, 59, 36, 7.86,-19,
                       26),
    Group_N = c(1L, 59L, 178L, 159L, 19L, 26L),
    Group_Quality = c(18.5,
                      20, 19.1, 20.1, 15, 17)
  ),
  class = "data.frame",
  row.names = c(NA,-6L)
)

data1 %>%
  mutate(Group = str_replace_all(Group, '\\s', '\n')) %>% 
  ggplot(aes(x = Group, 
             y = Group_Quality
  )) +
  geom_point(aes(
    size = Group_N,
    color = Group_Strength)) +
  theme_minimal() +
  scale_size_area(max_size = 20) +
  geom_label(aes(label = Group),
             nudge_y = - .35 * IQR(data1$Group_Quality)) +
  ylim(min(data1$Group_Quality) * .9,
       max(data1$Group_Quality) * 1.05)

Created on 2020-12-19 by the reprex package (v0.3.0)