From 1ae69c8e2acef38307d6c562efb8b0d659142b42 Mon Sep 17 00:00:00 2001 From: Quentin Dufour Date: Wed, 28 Sep 2022 14:59:18 +0200 Subject: To fit or not to fit --- artifacts/2022-09-23-s3lat/plot.R | 2 +- artifacts/2022-09-23-s3lat/plot.png | Bin 145685 -> 147625 bytes .../2022-09-24-s3billion/garage-regression.png | Bin 0 -> 291615 bytes artifacts/2022-09-24-s3billion/garage.png | Bin 250245 -> 237406 bytes artifacts/2022-09-24-s3billion/plot.R | 18 ++++++++++++++++-- 5 files changed, 17 insertions(+), 3 deletions(-) create mode 100644 artifacts/2022-09-24-s3billion/garage-regression.png diff --git a/artifacts/2022-09-23-s3lat/plot.R b/artifacts/2022-09-23-s3lat/plot.R index dd904e6..98eba52 100644 --- a/artifacts/2022-09-23-s3lat/plot.R +++ b/artifacts/2022-09-23-s3lat/plot.R @@ -19,7 +19,7 @@ ggplot(c, aes(x=endpoint,y=time_mean,fill=daemon,ymin=time_min,ymax=time_max)) + coord_flip() + labs( x="S3 Endpoint", - y="Latency (ms)", + y="Request duration (ms)", fill="Daemon", caption="Get the code to reproduce this graph at https://git.deuxfleurs.fr/Deuxfleurs/mknet", title="S3 endpoint latency in a simulated geo-distributed cluster", diff --git a/artifacts/2022-09-23-s3lat/plot.png b/artifacts/2022-09-23-s3lat/plot.png index 8962b65..92eac3f 100644 Binary files a/artifacts/2022-09-23-s3lat/plot.png and b/artifacts/2022-09-23-s3lat/plot.png differ diff --git a/artifacts/2022-09-24-s3billion/garage-regression.png b/artifacts/2022-09-24-s3billion/garage-regression.png new file mode 100644 index 0000000..f2c0aef Binary files /dev/null and b/artifacts/2022-09-24-s3billion/garage-regression.png differ diff --git a/artifacts/2022-09-24-s3billion/garage.png b/artifacts/2022-09-24-s3billion/garage.png index 319760d..9554e60 100644 Binary files a/artifacts/2022-09-24-s3billion/garage.png and b/artifacts/2022-09-24-s3billion/garage.png differ diff --git a/artifacts/2022-09-24-s3billion/plot.R b/artifacts/2022-09-24-s3billion/plot.R index 2baf70d..bf8b29c 100644 --- a/artifacts/2022-09-24-s3billion/plot.R +++ b/artifacts/2022-09-24-s3billion/plot.R @@ -1,12 +1,25 @@ library(tidyverse) +library(ggpmisc) -read_csv("garage-v0.8-beta2-lmdb.csv") %>% mutate(batch_dur_sec = batch_dur_nanoseconds / 1000 / 1000 / 1000 ) -> s +read_csv("garage-v0.8-beta2-lmdb.csv") %>% mutate(batch_dur_sec = batch_dur_nanoseconds / 1000 / 1000 / 1000) %>% filter(total_objects != 0) -> s + +reg1 <- lm(s$batch_dur_sec~s$total_objects) +reg2 <- lm(s$batch_dur_sec ~ log(s$total_objects)) + +f1 <- y~log(x) +f2 <- y~x + ggplot(s, aes(x=total_objects, y=batch_dur_sec)) + geom_point() + - geom_smooth(method = "gam", se = FALSE) + + #geom_smooth(method="lm",formula=f1, se = FALSE, color="red") + + #geom_smooth(method="lm",formula=f2, se = FALSE, color="blue") + + #stat_poly_eq(formula = f1, label.y = 0.9, color = "red", aes(label=paste(..eq.label..,..rr.label..,..adj.rr.label..,..AIC.label..,..BIC.label.., sep = "~~~"))) + + #stat_poly_eq(formula = f2, label.y = 0.8, color="blue",aes(label=paste(..eq.label..,..rr.label..,..adj.rr.label..,..AIC.label..,..BIC.label.., sep = "~~~"))) + + #geom_smooth(method = "gam", se = FALSE) + scale_x_continuous(expand=c(0,0), breaks = scales::pretty_breaks(n = 10))+ scale_y_continuous(expand=c(0,0), breaks = scales::pretty_breaks(n = 10))+ + coord_cartesian(ylim=c(0,60)) + labs( y="Time (in sec) spent sending a batch (8192 objects)", x="Total number of objects stored in the cluster", @@ -15,6 +28,7 @@ ggplot(s, aes(x=total_objects, y=batch_dur_sec)) + subtitle="Daemon: Garage v0.8 beta 2 with LMDB as db_engine\nBenchmark: 128 batch. 8192 objects/batch. 32 threads/batch. 256 objects/thread. 16-byte/objects.\nEnvironment: mknet (Ryzen 5 1400, 16GB RAM, SSD). DC topo (3 nodes, 1Gb/s, 1ms latency).") + theme_classic() ggsave("./garage.png", width=200, height=120, units="mm") +#ggsave("./garage-regression.png", width=200, height=120, units="mm") -- cgit v1.2.3