library(ggplot2)
# Let us make a data frame with two quantitative variables. We generate these
# variables using random numbers from a normal (Gaussian) distribution.
# Simulate two quantitative variables from normal (Gaussian) draws and collect
# them in a data frame.
set.seed(42) # fix the RNG seed so the simulated values are reproducible
x <- rnorm(2000, mean = 15, sd = 20)
# y is x plus independent Gaussian noise, so the two variables are related
y <- x + rnorm(2000, mean = 2, sd = 30)
df <- data.frame(x = x, y = y)
# Let us make a simple scatter plot to illustrate the problem of overplotting.
# Baseline scatter plot of y against x with no transparency set, so dense
# regions overplot. `df` is passed straight to ggplot() because only ggplot2
# is attached here and it does not export the `%>%` pipe.
ggplot(df, aes(x = x, y = y)) +
  geom_point()
data:image/s3,"s3://crabby-images/0372e/0372e38d48a61df2478040c78abe84cebe4876f2" alt=""
# Same scatter plot with semi-transparent points (alpha = 0.3), so regions
# where many points overlap appear darker. `df` is passed straight to ggplot()
# because only ggplot2 is attached here and it does not export the `%>%` pipe.
ggplot(df, aes(x = x, y = y)) +
  geom_point(alpha = 0.3)
data:image/s3,"s3://crabby-images/0d4d9/0d4d94aa58b85a86c3aefc3f32149034cc1eb467" alt=""