@@ -22,7 +22,7 @@ source(file.path(scriptDir, "porce", "utils.R"))
2222
2323# dataDir <- file.path(experimentDataDir, "PorcE", "impltype-comparison", "20180415-a001")
2424# dataDir <- file.path(localExperimentDataDir, "20180730-a010")
25- dataDir <- file.path(localExperimentDataDir , " 20180802-a001 " )
25+ dataDir <- file.path(localExperimentDataDir , " 20180805-a002 " )
2626scalaDataDir <- file.path(localExperimentDataDir , " 20180718-a002" )
2727
2828loadData <- function (dataDir ) {
@@ -165,61 +165,77 @@ print(kable(t, "latex"))
# Build filledInData: full-join processedData with synthetic optLevel = 0 rows
# derived from the Orc / optLevel 3 rows. After the join, keep the measured
# elapsedTime_mean (.x) where it exists and fall back to the synthetic constant
# (.y) otherwise, then drop the two suffixed helper columns.
# The removed ("-") lines used 8 * 60 and joined without nCPUs; the added ("+")
# lines use 10 * 60 and additionally carry and join on nCPUs.
# NOTE(review): the padding inside the quoted key names looks like an
# extraction artifact of this rendering - confirm against the real file.
165165filledInData <- processedData %> %
166166 full_join(processedData %> %
167167 filter(optLevel == 3 , implType == " Orc" ) %> %
168- transmute(benchmarkProblemName , benchmarkName , optLevel = 0 , elapsedTime_mean = 8 * 60 ),
169- by = c(" benchmarkProblemName" , " benchmarkName" , " optLevel" )) %> %
168+ transmute(benchmarkProblemName , benchmarkName , nCPUs , optLevel = 0 , elapsedTime_mean = 10 * 60 ),
169+ by = c(" benchmarkProblemName" , " benchmarkName" , " optLevel" , " nCPUs " )) %> %
170170 mutate(elapsedTime_mean = if_else(is.na(elapsedTime_mean.x ), elapsedTime_mean.y , elapsedTime_mean.x ), elapsedTime_mean.x = NULL , elapsedTime_mean.y = NULL )
171171
# Build times2, a wide table of timing columns taken from processedData:
#   orc3Time     - elapsedTime_mean of implType "Orc", optLevel 3
#   orc0Time     - elapsedTime_mean of implType "Orc", optLevel 0
#   scalaTime    - elapsedTime_mean of implType "Scala"
#   orcScalaTime - elapsedTime_mean of implType "Orc+Scala" with optimized == T
# The added ("+") lines start from the Orc optLevel 3 rows and full-join the
# other three on benchmarkProblemName and nCPUs, then pipe the result through
# dropBounds() (defined outside this view).
# The removed ("-") lines started from filledInData and joined without an
# explicit `by` and without nCPUs.
172172times2 <-
173- full_join(filledInData ,
174- processedData %> %
175- filter(implType == " Orc" , optLevel == 3 , optimized == T ) %> %
176- transmute(benchmarkProblemName , orc3Time = elapsedTime_mean )) %> %
173+ processedData %> %
174+ filter(implType == " Orc" , optLevel == 3 ) %> %
175+ transmute(benchmarkProblemName , nCPUs , microbenchmark , orc3Time = elapsedTime_mean ) %> %
176+ full_join(processedData %> %
177+ filter(implType == " Orc" , optLevel == 0 ) %> %
178+ transmute(benchmarkProblemName , nCPUs , orc0Time = elapsedTime_mean ),
179+ by = c(" benchmarkProblemName" , " nCPUs" )) %> %
177180 full_join(processedData %> %
178181 filter(implType == " Scala" ) %> %
179- transmute(benchmarkProblemName , scalaTime = elapsedTime_mean )) %> %
182+ transmute(benchmarkProblemName , nCPUs , scalaTime = elapsedTime_mean ),
183+ by = c(" benchmarkProblemName" , " nCPUs" )) %> %
180184 full_join(processedData %> %
181185 filter(implType == " Orc+Scala" , optimized == T ) %> %
182- transmute(benchmarkProblemName , orcScalaTime = elapsedTime_mean ))
186+ transmute(benchmarkProblemName , nCPUs , orcScalaTime = elapsedTime_mean ),
187+ by = c(" benchmarkProblemName" , " nCPUs" )) %> %
188+ dropBounds()
183189 # filter(implType == "Orc") %>%
184190 # mutate(normalizedTime = elapsedTime_mean / orc3Time)
185191
186192# print(geomean((times2 %>% mutate(normalizedTime = elapsedTime_mean / orc3Time) %>% filter(optLevel == 3))$normalizedTime))
187193
188- normalizedToScalaTimeAtMost <- times2 %> % mutate(normalizedTime = elapsedTime_mean / if_else(is.na(scalaTime ), 8 * 60 , scalaTime ))
# Where no Orc+Scala measurement exists, use the Orc optLevel 3 time instead.
times2 <- times2 %>%
  mutate(orcScalaTime = if_else(is.na(orcScalaTime), orc3Time, orcScalaTime))

# Normalize every *Time column by the Scala time, falling back to 10 * 60
# where scalaTime is NA.
#
# mutate_at() rewrites the selected columns one after another, and scalaTime
# is itself one of the selected columns. Dividing by scalaTime directly means
# that every column processed after scalaTime (here orcScalaTime) is divided
# by the already-normalized scalaTime (i.e. 1) and is left unnormalized.
# Freeze the denominator in a helper column first, then drop it again.
normalizedToScalaTimeAtMost <- times2 %>%
  mutate(normBase = if_else(is.na(scalaTime), 10 * 60, scalaTime)) %>%
  mutate_at(vars(ends_with("Time")), funs(. / normBase)) %>%
  mutate(normBase = NULL)
189197
190- print(
191- geomean((normalizedToScalaTimeAtMost %> % filter(implType == " Orc" , optLevel == 3 , microbenchmark == F ))$ normalizedTime )
# Print an expression together with its value as "<expression> = <value>".
#
# expr: any expression; its unevaluated source text is used as the label and
#       its evaluated result as the value.
#
# deparse() splits expressions longer than its width cutoff into several
# strings. Pasting that vector directly would repeat the value once per
# fragment, so the fragments are trimmed and joined into one label first.
print_expr <- function(expr) {
  label <- paste(trimws(deparse(substitute(expr))), collapse = " ")
  cat(paste(label, "=", expr, "\n"))
}
202+
# Report summary values computed from normalizedToScalaTimeAtMost via geomean()
# (defined outside this view; presumably a geometric mean - confirm).
# Added ("+") lines: rows with nCPUs == 24, reporting orc3Time for
# non-microbenchmarks, orc3Time for microbenchmarks, and orcScalaTime for
# non-microbenchmarks. Removed ("-") lines show the earlier print() calls that
# filtered on implType / optLevel and read normalizedTime.
203+ print_expr(
204+ geomean((normalizedToScalaTimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ orc3Time )
192205)
193- print (
194- geomean((normalizedToScalaTimeAtMost %> % filter(implType == " Orc " , optLevel == 3 , microbenchmark == T ))$ normalizedTime )
206+ print_expr (
207+ geomean((normalizedToScalaTimeAtMost %> % filter(microbenchmark == T , nCPUs == 24 ))$ orc3Time )
195208)
196- print (
197- geomean((normalizedToScalaTimeAtMost %> % filter(implType == " Orc+Scala " , optLevel == 3 , microbenchmark == F ))$ normalizedTime )
209+ print_expr (
210+ geomean((normalizedToScalaTimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ orcScalaTime )
198211)
199212
200- normalizedToOrcScalaTimeAtMost <- times2 %> % mutate( normalizedTime = elapsedTime_mean / orcScalaTime )
# Normalize every *Time column by the Orc+Scala time, falling back to 10 * 60
# where orcScalaTime is NA.
#
# mutate_at() rewrites the selected columns one after another, and
# orcScalaTime is itself one of them. Dividing by it directly is only correct
# while orcScalaTime happens to be the last matching column; any *Time column
# placed after it would be divided by the already-normalized value (1).
# Freeze the denominator in a helper column first, then drop it again.
normalizedToOrcScalaTimeAtMost <- times2 %>%
  mutate(normBase = if_else(is.na(orcScalaTime), 10 * 60, orcScalaTime)) %>%
  mutate_at(vars(ends_with("Time")), funs(. / normBase)) %>%
  mutate(normBase = NULL)
201214
# Report summary values computed from normalizedToOrcScalaTimeAtMost via
# geomean() (defined outside this view; presumably a geometric mean - confirm).
# Added ("+") lines: non-microbenchmark rows with nCPUs == 24, reporting
# orc3Time, orc0Time and scalaTime in turn. Removed ("-") lines show the
# earlier print() calls that filtered on implType / optLevel / optimized and
# read normalizedTime.
202- print (
203- geomean((normalizedToOrcScalaTimeAtMost %> % filter(implType == " Orc " , optLevel == 3 , optimized == T , microbenchmark == F ))$ normalizedTime )
215+ print_expr (
216+ geomean((normalizedToOrcScalaTimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ orc3Time )
204217)
205- print (
206- geomean((normalizedToOrcScalaTimeAtMost %> % filter(implType == " Orc " , optLevel == 0 , optimized == T , microbenchmark == F ))$ normalizedTime )
218+ print_expr (
219+ geomean((normalizedToOrcScalaTimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ orc0Time )
207220)
208- print (
209- geomean((normalizedToOrcScalaTimeAtMost %> % filter(implType == " Scala " , microbenchmark == F ))$ normalizedTime )
221+ print_expr (
222+ geomean((normalizedToOrcScalaTimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ scalaTime )
210223)
211224
212- normalizedToOrc3Time <- times2 %> % mutate( normalizedTime = elapsedTime_mean / orc3Time )
# Normalize every *Time column by the Orc optLevel 3 time, falling back to
# 10 * 60 where orc3Time is NA.
#
# mutate_at() rewrites the selected columns one after another, and orc3Time
# is itself one of them. Dividing by orc3Time directly turns orc3Time into 1
# first, so every *Time column processed after it (orc0Time, scalaTime, ...)
# is divided by 1 and is left unnormalized.
# Freeze the denominator in a helper column first, then drop it again.
normalizedToOrc3TimeAtMost <- times2 %>%
  mutate(normBase = if_else(is.na(orc3Time), 10 * 60, orc3Time)) %>%
  mutate_at(vars(ends_with("Time")), funs(. / normBase)) %>%
  mutate(normBase = NULL)
213226
# Report summary values computed from normalizedToOrc3TimeAtMost via geomean()
# (defined outside this view; presumably a geometric mean - confirm).
# Added ("+") lines: non-microbenchmark rows with nCPUs == 24, reporting
# orc0Time and scalaTime. Removed ("-") lines show the earlier print() call on
# normalizedToOrc3Time that read normalizedTime.
214- print(
215- geomean((normalizedToOrc3Time %> % filter(implType == " Orc" , optLevel == 3 , optimized == T , microbenchmark == F ))$ normalizedTime )
227+ print_expr(
228+ geomean((normalizedToOrc3TimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ orc0Time )
229+ )
230+ print_expr(
231+ geomean((normalizedToOrc3TimeAtMost %> % filter(microbenchmark == F , nCPUs == 24 ))$ scalaTime )
216232)
217233
218234
219- # print (
235+ # print_expr (
220236# geomean((times2 %>% mutate(normalizedTime = elapsedTime_mean / scalaTime) %>% filter(implType == "Orc", optLevel == 3, normalizedTime > 1))$normalizedTime)
221237# )
222- # print (
238+ # print_expr (
223239# geomean((times2 %>% mutate(normalizedTime = elapsedTime_mean / scalaTime) %>% filter(implType == "Orc+Scala", optLevel == 3, normalizedTime > 1))$normalizedTime)
224240# )
225241
0 commit comments