|
@@ -24,12 +24,39 @@ theme(axis.title.y=element_text(vjust=0.9),
|
|
|
|
|
|
|
|
|
# Standard error of the mean of x: square root of the sample variance
# divided by the number of elements. No NA handling is applied; var() and
# length() see x exactly as given.
se <- function(x) {
  n <- length(x)
  sqrt(var(x) / n)
}
|
|
|
|
|
|
|
|
|
|
|
|
# survey
# Mean and standard error of timesec for the "survey" experiment, one row per
# (sys, s, conf). `tool` joins system and configuration into one label and
# `datasize` maps the dataset name in `s` to a number through switch().
# Renjin rows are kept only when the tool is "Renjin jitopt".
d <- all %>%
  filter(exp == "survey") %>%
  group_by(sys, s, conf) %>%
  summarize(meant = mean(timesec), se = se(timesec)) %>%
  mutate(
    tool = paste(sys, conf),
    datasize = sapply(s, switch,
                      alabama = 47512, california = 1060060, acs3yr = 9093077)
  ) %>%
  filter(sys != "Renjin" | tool == "Renjin jitopt")

# Show the mean times, ordered by dataset.
print(d %>% select(sys, s, meant) %>% arrange(s))

# Error-bar aesthetics: one standard error above and below the mean.
limits <- aes(ymax = meant + se, ymin = meant - se, width = 2)
|
|
|
|
|
|
# Write the survey timing plot to survey.pdf (10 x 7 inches).
pdf("survey.pdf", width = 10, height = 7)

# The plot is stored and print()ed explicitly, as the other sections of this
# file do. A bare ggplot expression is drawn only by top-level auto-printing,
# which does not happen when the file is run through source(), leaving the
# PDF empty.
p <- ggplot(d, aes(datasize, meant, group = tool)) +
  geom_point(size = 4) +
  geom_line(size = 1.5, aes(group = tool, linetype = tool)) +
  geom_pointrange(limits) +
  #scale_y_log10(breaks=ybreaks, labels=ylabels) +
  # x axis is logarithmic with one break per dataset size.
  scale_x_log10(breaks = c(47512, 1060060, 9093077)) +
  xlab("Dataset Size (elements, log scale)") +
  ylab("Execution Time (s)") +
  theme +
  # Text labels at hand-picked coordinates.
  annotate("text", x = 10^6.6, y = 45, label = "GNU R",
           family = "serif", size = 10) +
  annotate("text", x = 10^6.4, y = 100, label = "sqlsurvey",
           family = "serif", size = 10) +
  annotate("text", x = 10^6.8, y = 15, label = "Renjin",
           family = "serif", size = 10)
  #scale_color_brewer(palette=cBrwPl) +
  #guides(colour=guide_legend(keywidth=3.5))

print(p)

dev.off()
|
|
|
|
|
|
|
|
|
|
|
|
# parallel
|
|
|
|
|
|
|
|
@@ -76,13 +103,12 @@ dev.off()
|
|
|
# # annotate("text", x=3.5, y=20, label="Renjin ", family="serif", size=10)
|
|
|
|
|
|
# print(p)
|
|
|
# dev.off()
|
|
|
|
|
|
|
|
|
# stop() signals an error at this point, so a top-to-bottom run of the script
# ends here and the sections below are not executed.
# NOTE(review): presumably a deliberate early exit -- confirm it should stay.
stop()
|
|
|
# recycling
# Mean and standard error of timesec for the "recycling" experiment,
# restricted to s > 5, one row per (exp, sys, s, conf). `datasize` is
# 10 raised to the integer value of `s`; `tool` joins system and
# configuration into one label.
d <- all %>%
  filter(exp == "recycling", s > 5) %>%
  group_by(exp, sys, s, conf) %>%
  summarize(meant = mean(timesec), se = se(timesec)) %>%
  mutate(
    datasize = 10^as.integer(s),
    tool = paste(sys, conf)
  )

print(d)
|
|
@@ -102,39 +128,12 @@ p <- ggplot(d,aes(datasize,meant,group=tool)) +
|
|
|
annotate("text", x=10^7.8, y=21, label="GNU R", family="serif", size=10)
|
|
|
|
|
|
|
|
|
print(p)
|
|
|
dev.off()
|
|
|
|
|
|
# survey
# Mean and standard error of timesec for the "survey" experiment, one row per
# (sys, s, conf). `tool` joins system and configuration into one label and
# `datasize` maps the dataset name in `s` to a number through switch().
# Renjin rows are kept only when the tool is "Renjin jitopt".
d <- all %>%
  filter(exp == "survey") %>%
  group_by(sys, s, conf) %>%
  summarize(meant = mean(timesec), se = se(timesec)) %>%
  mutate(
    tool = paste(sys, conf),
    datasize = sapply(s, switch,
                      alabama = 47512, california = 1060060, acs3yr = 9093077)
  ) %>%
  filter(sys != "Renjin" | tool == "Renjin jitopt")

print(d)

# Error-bar aesthetics: one standard error above and below the mean.
limits <- aes(ymax = meant + se, ymin = meant - se, width = 2)
|
|
|
|
|
|
# Write the survey timing plot to survey.pdf (10 x 7 inches).
pdf("survey.pdf", width = 10, height = 7)

# The plot is stored and print()ed explicitly, as the other sections of this
# file do. A bare ggplot expression is drawn only by top-level auto-printing,
# which does not happen when the file is run through source(), leaving the
# PDF empty.
p <- ggplot(d, aes(datasize, meant, group = tool)) +
  geom_point(size = 4) +
  geom_line(size = 1.5, aes(group = tool, linetype = tool)) +
  geom_pointrange(limits) +
  #scale_y_log10(breaks=ybreaks, labels=ylabels) +
  # x axis is logarithmic with one break per dataset size.
  scale_x_log10(breaks = c(47512, 1060060, 9093077)) +
  xlab("Dataset Size (elements, log scale)") +
  ylab("Execution Time (s)") +
  theme +
  # Text labels at hand-picked coordinates.
  annotate("text", x = 10^6.6, y = 45, label = "GNU R",
           family = "serif", size = 10) +
  annotate("text", x = 10^6.4, y = 100, label = "sqlsurvey",
           family = "serif", size = 10) +
  annotate("text", x = 10^6.8, y = 15, label = "Renjin",
           family = "serif", size = 10)
  #scale_color_brewer(palette=cBrwPl) +
  #guides(colour=guide_legend(keywidth=3.5))

print(p)

dev.off()
|
|
|
|
|
|
|
|
|
# # identity
# Mean and standard error of timesec for the "identity" experiment,
# restricted to s > 5, one row per (exp, sys, conf, s). `tool` is the bare
# system name when conf is "none", otherwise system and configuration joined;
# `datasize` is 10 raised to the integer value of `s`.
d <- all %>%
  filter(exp == "identity", s > 5) %>%
  group_by(exp, sys, conf, s) %>%
  summarize(meant = mean(timesec), se = se(timesec)) %>%
  mutate(
    tool = ifelse(conf == "none", sys, paste(sys, conf)),
    datasize = 10^as.integer(s)
  )
|
|
@@ -160,13 +159,13 @@ ggplot(d,aes(datasize,meant,group=tool)) +
|
|
|
|
|
|
dev.off()
|
|
|
|
|
|
|
|
|
# pushdown
# Mean and standard error of timesec for the "pushdown" experiment, one row
# per (exp, sys, s); `tool` is the system name and `datasize` is 10 raised to
# the integer value of `s`.
# NOTE(review): the two `d <- all %>% ...` lines below differ only in the
# threshold (`s > 4` vs `s > 5`) and both end in a pipe; this looks like two
# revisions of the same line kept side by side -- confirm which one is
# intended and drop the other.
|
|
|
|
|
|
d <- all %>% filter(exp=="pushdown", s > 4) %>% group_by(exp, sys, s) %>%
|
|
|
d <- all %>% filter(exp=="pushdown", s > 5) %>% group_by(exp, sys, s) %>%
|
|
|
summarize(meant=mean(timesec), se=se(timesec)) %>%
|
|
|
mutate(tool=sys, datasize=10^as.integer(s))
|
|
|
|
|
|
print(d)
|
|
|
|
|
|
# Error-bar aesthetics: one standard error above and below the mean.
limits <- aes(ymax = meant + se, ymin=meant - se, width=2)
|
|
@@ -176,13 +175,13 @@ p <- ggplot(d,aes(datasize,meant,group=tool)) +
|
|
|
geom_point(size=4) + geom_line(size=1.5, aes(group=tool, linetype=tool)) +
|
|
|
geom_pointrange(limits) +
|
|
|
# scale_y_log10(breaks=ybreaks, labels=ylabels) +
|
|
|
scale_x_log10(breaks=xbreaks, labels=xlabels) +
|
|
|
|
|
|
xlab("Dataset Size (elements, log scale)") + ylab("Execution Time (s)") + theme +
|
|
|
annotate("text", x=10^7.5, y=5, label="GNU R", family="serif", size=10)+
|
|
|
annotate("text", x=10^7.6, y=5, label="GNU R", family="serif", size=10)+
|
|
|
annotate("text", x=10^7.6, y=.4, label="Renjin ", family="serif", size=10)
|
|
|
|
|
|
print(p)
|
|
|
dev.off()
|
|
|
|
|
|
|