    def load(self, bench_filename):
        with open(self.dir_name + bench_filename) as json_file:
            # keep only the experiments that succeeded
            filtered_input_data = filter(
                lambda experiment: experiment["succeeded"] is True,
                json.load(json_file),
            )
            self.data = sorted(
                filtered_input_data,
                key=lambda experiment: experiment["results"]["query_id"],
            )

    def getFrontAttribute(self, attribute):
        return self.data[0]["results"][attribute]
        for query in query_names:
            for experiment in self.data:
                assert attribute in experiment["results"], (
                    attribute + " is not a valid attribute."
                )
                if query == experiment["results"]["query_id"]:
                    result.append(experiment["results"][attribute])
        for experiment in self.data:
            result.append(experiment["results"]["query_id"])
        assert isinstance(ref, BenchmarkLoader)
        assert isinstance(sample, BenchmarkLoader)
        for query in self.__label_name_ref:
            if query not in self.__label_name_sample:
                self.__missing_queries_sample.append(query)
                self.__label_name_ref.remove(query)
        for query in self.__label_name_sample:
            if query not in self.__label_name_ref:
                self.__missing_queries_ref.append(query)
                self.__label_name_sample.remove(query)
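        # e.g., a query that appears only in the reference results ends up in
        # __missing_queries_sample and is dropped from the cross comparison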
            print(" " + h, end="")
        print("Differences outside of %2.0f%%: " % (epsilon * 100), end="")
        for i in range(len(speedup)):
            if abs(speedup[i] - 1.0) > epsilon:
                print(
                    "\n%s: reference = %.2f ms, sample = %.2f ms, speedup = %.2fx"
                    % (self.__label_name_ref[i], self.__attribute_ref[i],
                       self.__attribute_sample[i], speedup[i]),
                    end="",
                )
            print(": None", end="")
        print("\n*** Missing queries from reference: ", end="")
        for query in self.__missing_queries_ref:
            print(query + " ", end="")
        print("\n*** Missing queries from sample: ", end="")
        for query in self.__missing_queries_sample:
            print(query + " ", end="")
132 "\n======================================================================="
    zipped = list(zip(x, y))
    for q in zipped:
        result.append(q[0] / q[1])
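    # e.g., x = [10.0, 20.0] and y = [5.0, 40.0] give result = [2.0, 0.5],
    # i.e. the element-wise ratio x[i] / y[i]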
    """Prints the benchmark results to the terminal.

    By default it cross-compares a reference branch (ref) and a sample branch
    (sample): for a particular attribute, all measurements within each branch are
    shown, along with the speedup of the sample relative to the reference.
    If cross_comparison is disabled, only the results of the ref branch are shown.
    """
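    # Minimal usage sketch (illustrative; refBench and sampleBench are assumed to be
    # BenchmarkLoader instances that have already loaded their results):
    #   printer = PrettyPrint(refBench, sampleBench, "query_exec_trimmed_avg")
    #   printer.printAttribute()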
        cross_comparison=True,
        num_items_per_line=5,
        assert isinstance(ref, BenchmarkLoader)
        assert isinstance(sample, BenchmarkLoader)
            ref.getRunTableName(),
        for query in self.__label_name_ref:
            if query not in self.__label_name_sample:
                self.__missing_queries_sample.append(query)
                self.__label_name_ref.remove(query)
        for query in self.__label_name_sample:
            if query not in self.__label_name_ref:
                self.__missing_queries_ref.append(query)
                self.__label_name_sample.remove(query)
            print(pattern, end="")
            if isinstance(array[i], float):
                print("%10.2f" % (array[i]), end="")
            elif isinstance(array[i], str):
                print("%10s" % (array[i]), end="")
        print("%10s" % "Queries", end="")
        print("%10s" % "Reference", end="")
        print("%10s" % "Sample", end="")
        print("%10s" % "Speedup", end="")
        opts, args = getopt.getopt(
            sys.argv[1:], "hs:r:e:a:p",
            ["help", "sample=", "reference=", "epsilon=", "attribute=", "print"],
        )
    except getopt.GetoptError:
        print("python3 analyze-benchmark.py -s <sample dir> -r <reference dir> -e <epsilon> -a <attribute> -p")
    dir_artifact_sample = ""
    dir_artifact_ref = ""
    query_attribute = "query_exec_trimmed_avg"
    for opt, arg in opts:
        if opt in ("-h", "--help"):
            print(
                """
    -s/--sample:\t\t\t directory of the results for the benchmarked sample branch
    -r/--reference:\t\t\t directory of the results for the benchmarked reference branch
    -e/--epsilon:\t\t\t ratio tolerance for reporting results outside this range
    -a/--attribute:\t\t\t attribute to be used for benchmark comparison (default: query_total_avg)
    -p/--print:\t\t\t\t print all the results
    """
            )
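            # Example invocation (directory names and epsilon value are hypothetical):
            #   python3 analyze-benchmark.py -s ./sample_results -r ./ref_results -e 0.05 -a query_exec_trimmed_avg -p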
        if opt in ("-s", "--sample"):
            dir_artifact_sample = arg
            assert os.path.isdir(dir_artifact_sample)
        elif opt in ("-r", "--reference"):
            dir_artifact_ref = arg
            assert os.path.isdir(dir_artifact_ref)
        elif opt in ("-e", "--epsilon"):
            epsilon = float(arg)
        elif opt in ("-a", "--attribute"):
            query_attribute = arg
        elif opt in ("-p", "--print"):
    assert dir_artifact_ref != ""
    assert dir_artifact_sample != ""
    GPU_list_ref = listdir(dir_artifact_ref)
    GPU_list_sample = listdir(dir_artifact_sample)
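    # Assumed artifact layout (inferred from the path handling below):
    #   <artifact dir>/<GPU name>/Benchmarks/<benchmark result>.json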
    for gpu in GPU_list_ref:
        dir_name_ref = dir_artifact_ref + "/" + gpu + "/Benchmarks"
        filename_list_ref = listdir(dir_name_ref)
        dir_name_ref += "/"
        refBench = BenchmarkLoader(dir_name_ref, filename_list_ref)
        if gpu in GPU_list_sample:
            dir_name_sample = dir_artifact_sample + "/" + gpu + "/Benchmarks"
            filename_list_sample = listdir(dir_name_sample)
            dir_name_sample += "/"
            sampleBench = BenchmarkLoader(
                dir_name_sample, filename_list_sample
            )
            for index in range(len(filename_list_ref)):
                refBench.load(filename_list_ref[index])
                if filename_list_ref[index] in filename_list_sample:
                    sampleBench.load(filename_list_ref[index])
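                    # note: comparison is keyed by file name, so a benchmark json is
                    # compared only when the same file exists for both ref and sample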
334 "\n+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++"
336 print(
"++++ " + sampleBench.getGpuName())
339 + refBench.getFrontAttribute(
"run_label")
341 + refBench.getFrontAttribute(
"run_version")
345 + sampleBench.getFrontAttribute(
"run_label")
347 + sampleBench.getFrontAttribute(
"run_version")
350 "+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++\n"
                    analyzer = BenchAnalyzer(
                        refBench, sampleBench, query_attribute
                    )
                    analyzer.findAnomaliesRatio(epsilon)
                    printer = PrettyPrint(
                        refBench, sampleBench, query_attribute
                    )
                    printer.printAttribute()
365 "No sample results for table "
366 + refBench.getRunTableName()
370 "======================================================================="
375 "\n+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++"
377 print(
"++++ No sample results for GPU " + gpu +
" were found.")
379 "+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++\n"
if __name__ == "__main__":