# P39.R

# making table data sets
library(dplyr)
library(tidyr)
library(MorpheusData)

#############benchmark 39
# Build the benchmark 39 fixtures: two input tables and the expected output.
# The seed is fixed so the random `z` values are reproducible across runs.
set.seed(1)
x <- letters[1:10]
df1 <- data.frame(x)
# 20 draws from N(mean = 100, sd = 10). `x` holds only 10 values, so
# data.frame() recycles it and every letter ends up with two `z` rows.
z <- rnorm(20, 100, 10)
df2 <- data.frame(x, z)

write.csv(df1, "data-raw/p39_input1.csv", row.names = FALSE)
write.csv(df2, "data-raw/p39_input2.csv", row.names = FALSE)

# Expected output: total `z` per key. The join key is spelled out so the
# result does not depend on dplyr inferring the shared columns, and no
# informational "Joining ..." message is emitted.
df_out <- inner_join(df1, df2, by = "x") %>%
  group_by(x) %>%
  summarise(newZ = sum(z))

write.csv(df_out, "data-raw/p39_output1.csv", row.names = FALSE)

# Reload the expected output from CSV and normalise its column types before
# saving it as package data: factor -> character, integer -> double.
p39_output1 <- read.csv("data-raw/p39_output1.csv", check.names = FALSE)
# vapply() always yields a logical mask, even for a zero-column table
# (sapply() would return an empty list there).
fctr.cols <- vapply(p39_output1, is.factor, logical(1))
int.cols <- vapply(p39_output1, is.integer, logical(1))

# List-style indexing never drops to a bare vector, and lapply() converts one
# whole column at a time, so zero, one, or many matching columns all take the
# same code path.
p39_output1[fctr.cols] <- lapply(p39_output1[fctr.cols], as.character)
p39_output1[int.cols] <- lapply(p39_output1[int.cols], as.numeric)
save(p39_output1, file = "data/p39_output1.rdata")

# Reload the first input table from CSV and normalise its column types before
# saving it as package data: factor -> character, integer -> double.
p39_input1 <- read.csv("data-raw/p39_input1.csv", check.names = FALSE)
# vapply() guarantees a logical mask regardless of how many columns exist.
fctr.cols <- vapply(p39_input1, is.factor, logical(1))
int.cols <- vapply(p39_input1, is.integer, logical(1))

# Index the data frame as a list so a single matching column is still handled
# as a column (not unpacked element by element), and an empty mask is a no-op.
p39_input1[fctr.cols] <- lapply(p39_input1[fctr.cols], as.character)
p39_input1[int.cols] <- lapply(p39_input1[int.cols], as.numeric)
save(p39_input1, file = "data/p39_input1.rdata")

# Reload the second input table from CSV and normalise its column types
# before saving it as package data: factor -> character, integer -> double.
p39_input2 <- read.csv("data-raw/p39_input2.csv", check.names = FALSE)
# vapply() pins the mask type to logical, unlike the type-unstable sapply().
fctr.cols <- vapply(p39_input2, is.factor, logical(1))
int.cols <- vapply(p39_input2, is.integer, logical(1))

# Column-wise conversion through list-style indexing: behaves the same for
# zero, one, or several matching columns.
p39_input2[fctr.cols] <- lapply(p39_input2[fctr.cols], as.character)
p39_input2[int.cols] <- lapply(p39_input2[int.cols], as.numeric)
save(p39_input2, file = "data/p39_input2.rdata")
# fredfeng/MorpheusData documentation built on May 16, 2019, 2:42 p.m.