# Exploratory session: load the benchmark results and work out how to derive
# a short per-query label from the identifier column.
read.csv("results.csv") # echo the raw file to the console
data <- read.csv("results.csv")
library(ggplot2)

# `[` on a character vector selects whole elements, not characters: element 1
# of a length-one vector is the string itself and element 2 is NA.
"this"[1]
"this"[2]
("this")[2]
("this")[1]

# substr() is the call that extracts characters by position; it is vectorised
# over its first argument.
substr(data$query, 1, 2)
substr("this", 1, 3)
substr("this", 1, 2)
substr("this", 1, 1)
# vapply() pins the result to a character vector even for empty input, where
# sapply() would silently return a list.
vapply(data$query, function(x) substr(x, 1, 1), character(1))
data$query
substr(data$num, 1, 2)
substr(data$num, 2, 2)

# `query` is the column being created here, so the "overall" rows have to be
# detected from `num`, the same column the label is cut from.
# NOTE(review): assumes `num` holds "overall" or a two-character id whose
# second character names the query -- confirm against results.csv.
data$query <- ifelse(data$num == "overall", "overall", substr(data$num, 2, 2))
# Reload the results and label each row: "overall" rows keep that label,
# every other row gets the second character of `num`.
data <- read.csv(file = "results.csv")
data$query <- ifelse(
  data$num == "overall",
  "overall",
  substr(data$num, start = 2, stop = 2)
)
head(data)
library(ggplot2)

# Bare plot of the per-query rows; no geom layer is added here.
ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query, y = time)
)
geom_boxplot # without parentheses this prints the function itself
help("geom_boxplot")
head(data)

# Bounds used later for error bars: time minus / plus sdtime.
data$time_lower <- data[["time"]] - data[["sdtime"]]
data$time_upper <- data[["time"]] + data[["sdtime"]]
head(data)
# Attempt 1: box plot of time per query for the non-"overall" rows.
# The aesthetic is spelled `ymin` (a misspelled name is ignored with a
# warning) and the empty `x = ` argument is dropped.
# NOTE(review): with the default boxplot stat the whiskers are computed from
# `time`, so the supplied ymin/ymax may be overridden -- confirm this geom is
# what was intended.
ggplot(subset(data, query != "overall"), aes(x = query, y = time)) +
  geom_boxplot(aes(ymax = time_upper, ymin = time_lower))

# Attempt 2: one bar per (query, size) drawn side by side, with error bars
# spanning time_lower..time_upper. stat = "identity" draws the supplied values
# as bar heights, so the layer needs an explicit `y` aesthetic.
ggplot(subset(data, query != "overall"), aes(x = query)) +
  geom_bar(
    stat = "identity",
    aes(y = time, fill = time, group = size),
    position = "dodge"
  ) +
  geom_errorbar(
    aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
# Dodged bars per (query, size) with error bars; fill follows `time`.
# Rendered twice, as in the recorded session.
ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = time, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = time, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )

# Same chart with the fill switched to `size`.
ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = size, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )

# Turn `size` into a factor (via its character form) and redraw.
data$size <- factor(as.character(data$size))
ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = size, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
help("as.factor")
# Rebuild the plotting data from the raw file and draw the per-query chart.
data <- read.csv("results.csv")

# "overall" rows keep that label; other rows use the 2nd character of `num`.
data$query <- ifelse(data$num == "overall", "overall", substr(data$num, 2, 2))

# factor(), not as.factor(): only factor() takes `levels`, which is what
# fixes the order to 5, 10, 20. as.factor(x, levels = ...) stops with an
# "unused argument" error.
data$size <- factor(as.character(data$size), levels = c("5", "10", "20"))

# Error-bar bounds: time plus / minus sdtime.
data$time_upper <- with(data, time + sdtime)
data$time_lower <- with(data, time - sdtime)

# One bar per (query, size), side by side, with matching error bars.
ggplot(subset(data, query != "overall"), aes(x = query)) +
  geom_bar(
    stat = "identity",
    aes(y = time, fill = size, group = size),
    position = "dodge"
  ) +
  geom_errorbar(
    aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
library(ggplot2)

# Prepare the results: query label, ordered size factor, error-bar bounds.
data <- read.csv(file = "results.csv")
data$query <- ifelse(
  data$num == "overall",
  "overall",
  substr(data$num, start = 2, stop = 2)
)
data$size <- factor(as.character(data$size), levels = c("5", "10", "20"))
data$time_upper <- data[["time"]] + data[["sdtime"]]
data$time_lower <- data[["time"]] - data[["sdtime"]]

# Per-query chart: shown once without labels, then again with axis and
# legend titles attached.
by_query <- ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = size, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
by_query
by_query <- by_query +
  labs(x = "Query", y = "Avg. Execution Time (ms)", fill = "Size (mm)")
by_query

# Chart of the "overall" rows only, one bar per size.
overall <- ggplot(
  data = data[!is.na(data$query) & data$query == "overall", , drop = FALSE],
  mapping = aes(x = size)
) +
  geom_bar(mapping = aes(y = time), stat = "identity", position = "dodge") +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower),
    position = "dodge"
  )
overall
# Variant that keeps the "overall" rows next to the individual queries.
by_query <- ggplot(data, aes(x = query)) +
  geom_bar(
    stat = "identity",
    aes(y = time, fill = size, group = size),
    position = "dodge"
  ) +
  geom_errorbar(
    aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  )
by_query <- by_query +
  labs(x = "Query", y = "Avg. Execution Time (ms)", fill = "Size (mm)")
by_query

# Figure that is written to disk: "overall" rows excluded. The labels are
# attached here because rebuilding `by_query` discards the ones added above;
# without this the saved PDF would fall back to the raw column names.
by_query <- ggplot(subset(data, query != "overall"), aes(x = query)) +
  geom_bar(
    stat = "identity",
    aes(y = time, fill = size, group = size),
    position = "dodge"
  ) +
  geom_errorbar(
    aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  ) +
  labs(x = "Query", y = "Avg. Execution Time (ms)", fill = "Size (mm)")
by_query
?ggsave
ggsave(filename = "timings.pdf", plot = by_query)
# End-to-end run: load results, derive plotting columns, draw the per-query
# chart and save it as timings.pdf.
data <- read.csv(file = "results.csv")
data$query <- ifelse(
  data$num == "overall",
  "overall",
  substr(data$num, start = 2, stop = 2)
)
data$size <- factor(as.character(data$size), levels = c("5", "10", "20"))
data$time_upper <- data[["time"]] + data[["sdtime"]]
data$time_lower <- data[["time"]] - data[["sdtime"]]

by_query <- ggplot(
  data = data[!is.na(data$query) & data$query != "overall", , drop = FALSE],
  mapping = aes(x = query)
) +
  geom_bar(
    mapping = aes(y = time, fill = size, group = size),
    stat = "identity",
    position = "dodge"
  ) +
  geom_errorbar(
    mapping = aes(ymax = time_upper, ymin = time_lower, group = size),
    position = "dodge"
  ) +
  labs(x = "Query", y = "Avg. Execution Time (ms)", fill = "Size (mm)")
by_query
ggsave(plot = by_query, filename = "timings.pdf")
# Language comparison: load the data and split it by `size`.
data <- read.csv(file = "comparison.csv")
head(data)
d10 <- data[!is.na(data$size) & data$size == 10, , drop = FALSE]
d20 <- data[!is.na(data$size) & data$size == 20, , drop = FALSE]
head(d10)

# Dodged bars grouped by language (no fill); drawn before and after the
# library() call, as in the recorded session.
ggplot(data = data, mapping = aes(x = query, y = time)) +
  geom_bar(
    mapping = aes(group = lang),
    stat = "identity",
    position = "dodge"
  )
library(ggplot2)
ggplot(data = data, mapping = aes(x = query, y = time)) +
  geom_bar(
    mapping = aes(group = lang),
    stat = "identity",
    position = "dodge"
  )

# Same bars, filled by language.
ggplot(data = data, mapping = aes(x = query, y = time)) +
  geom_bar(
    mapping = aes(group = lang, fill = lang),
    stat = "identity",
    position = "dodge"
  )

# Store `query` as character, then redo the per-size subsets.
data$query <- as.character(data$query)
d10 <- data[!is.na(data$size) & data$size == 10, , drop = FALSE]
d20 <- data[!is.na(data$size) & data$size == 20, , drop = FALSE]

# Labelled version.
ggplot(data = data, mapping = aes(x = query, y = time)) +
  geom_bar(
    mapping = aes(group = lang, fill = lang),
    stat = "identity",
    position = "dodge"
  ) +
  labs(
    x = "Query",
    y = "Avg. Execution Time over 10 Iterations",
    fill = "language"
  )

# Labelled version with the legend placed at the bottom.
ggplot(data = data, mapping = aes(x = query, y = time)) +
  geom_bar(
    mapping = aes(group = lang, fill = lang),
    stat = "identity",
    position = "dodge"
  ) +
  labs(
    x = "Query",
    y = "Avg. Execution Time over 10 Iterations",
    fill = "language"
  ) +
  theme(legend.position = "bottom")
# Build the language-comparison bar chart for one data frame.
#
# dat: data frame providing the `query`, `time` and `lang` columns that the
#      aesthetics refer to.
# Returns the ggplot object: bars of `time` per `query`, grouped and filled
# by `lang` and placed side by side, with axis/legend titles set and the
# legend positioned at the bottom.
g <- function(dat) {
  bars <- geom_bar(
    mapping = aes(group = lang, fill = lang),
    stat = "identity",
    position = "dodge"
  )
  titles <- labs(
    x = "Query",
    y = "Avg. Execution Time over 10 Iterations",
    fill = "language"
  )
  ggplot(data = dat, mapping = aes(x = query, y = time)) +
    bars +
    titles +
    theme(legend.position = "bottom")
}
# One titled chart per subset, built with g().
g10 <- g(dat = d10) + labs(title = "10MM observations")
g20 <- g(dat = d20) + labs(title = "20MM observations")
head(d10)

# Display both charts.
g10
g20

library(ggplot2)
# Run the saved graph script, echoing each expression as it is evaluated.
source(
  file = "~/PersonalProjects/kxmeetup/parallel_slides/data/graph.R",
  echo = TRUE
)
# Scalability experiment: execution time per query for each worker count.
# ggplot2 is attached before the first plot call.
library(ggplot2)

scalable_data <- read.csv("parallel_scalability.csv")
head(scalable_data)
scalable_data$query <- as.character(scalable_data$query)
head(scalable_data)

# Pass 1: `workers` as read from the file. The two labs() arguments need a
# comma between them; without it the whole expression fails to parse.
ggplot(scalable_data, aes(x = workers, y = time)) +
  geom_bar(
    stat = "identity",
    aes(group = query, fill = query),
    position = "dodge"
  ) +
  labs(
    x = "Workers (10MM floating pt. nums / worker)",
    y = "Avg. Execution Time (ms)"
  )

# Pass 2: `workers` as character, giving one discrete slot per worker count.
scalable_data$workers <- as.character(scalable_data$workers)
ggplot(scalable_data, aes(x = workers, y = time)) +
  geom_bar(
    stat = "identity",
    aes(group = query, fill = query),
    position = "dodge"
  ) +
  labs(
    x = "Workers (10MM floating pt. nums / worker)",
    y = "Avg. Execution Time (ms)"
  )

# Pass 3: explicit level order 3, 5, 10 (as plain strings "10" sorts before
# "3"). factor() is required here: as.factor() has no `levels` argument and
# stops with an "unused argument" error.
scalable_data$workers <- factor(
  as.character(scalable_data$workers),
  levels = c("3", "5", "10")
)
ggplot(scalable_data, aes(x = workers, y = time)) +
  geom_bar(
    stat = "identity",
    aes(group = query, fill = query),
    position = "dodge"
  ) +
  labs(
    x = "Workers (10MM floating pt. nums / worker)",
    y = "Avg. Execution Time (ms)"
  )
# Keep the scalability chart in a variable, write it to the figures
# directory, then re-run the saved graph script with echo on.
scalable_graph <- ggplot(
  data = scalable_data,
  mapping = aes(x = workers, y = time)
) +
  geom_bar(
    mapping = aes(group = query, fill = query),
    stat = "identity",
    position = "dodge"
  ) +
  labs(
    x = "Workers (10MM floating pt. nums / worker)",
    y = "Avg. Execution Time (ms)"
  )
ggsave(plot = scalable_graph, filename = "../figures/scalable_graph.pdf")
source(
  file = "~/PersonalProjects/kxmeetup/parallel_slides/data/graph.R",
  echo = TRUE
)
