diff options
Diffstat (limited to 'notify/output-bmk-results.log')
-rw-r--r-- | notify/output-bmk-results.log | 160 |
1 files changed, 48 insertions, 112 deletions
diff --git a/notify/output-bmk-results.log b/notify/output-bmk-results.log index e41284d..06ab495 100644 --- a/notify/output-bmk-results.log +++ b/notify/output-bmk-results.log @@ -105,23 +105,23 @@ output-bmk-results.py(258): print(results_df) benchmark symbol ... status_x status_y 0 500.perlbench_r perlbench_r_base.default ... failed-to-run failed-to-run 1 502.gcc_r cpugcc_r_base.default ... failed-to-run failed-to-run -2 505.mcf_r mcf_r_base.default ... -1 -1 +2 505.mcf_r mcf_r_base.default ... -1 success 4 508.namd_r namd_r_base.default ... failed-to-run failed-to-run 5 510.parest_r parest_r_base.default ... failed-to-run failed-to-run 6 511.povray_r povray_r_base.default ... failed-to-run failed-to-run 7 519.lbm_r lbm_r_base.default ... failed-to-run failed-to-run -8 520.omnetpp_r omnetpp_r_base.default ... failed-to-run failed-to-run -9 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run +8 519.lbm_r lbm_r_base.default ... failed-to-run failed-to-run +9 520.omnetpp_r omnetpp_r_base.default ... failed-to-run failed-to-run 10 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run -11 525.x264_r x264_r_base.default ... failed-to-run failed-to-run -12 526.blender_r blender_r_base.default ... failed-to-run failed-to-run -13 531.deepsjeng_r deepsjeng_r_base.default ... -1 -1 -15 538.imagick_r imagick_r_base.default ... failed-to-run failed-to-run +11 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run +12 525.x264_r x264_r_base.default ... failed-to-run failed-to-run +13 526.blender_r blender_r_base.default ... failed-to-run failed-to-run +14 531.deepsjeng_r deepsjeng_r_base.default ... -1 success 16 538.imagick_r imagick_r_base.default ... failed-to-run failed-to-run 17 541.leela_r leela_r_base.default ... failed-to-run failed-to-run 18 541.leela_r leela_r_base.default ... failed-to-run failed-to-run 20 544.nab_r nab_r_base.default ... failed-to-run failed-to-run -21 557.xz_r xz_r_base.default ... -1 -1 +21 557.xz_r xz_r_base.default ... -1 success [19 rows x 20 columns] output-bmk-results.py(261): for index, row in results_df.iterrows(): @@ -410,23 +410,23 @@ output-bmk-results.py(258): print(results_df) benchmark symbol ... status_x status_y 0 500.perlbench_r perlbench_r_base.default ... failed-to-run failed-to-run 1 502.gcc_r cpugcc_r_base.default ... failed-to-run failed-to-run -2 505.mcf_r mcf_r_base.default ... -1 -1 +2 505.mcf_r mcf_r_base.default ... -1 success 4 508.namd_r namd_r_base.default ... failed-to-run failed-to-run 5 510.parest_r parest_r_base.default ... failed-to-run failed-to-run 6 511.povray_r povray_r_base.default ... failed-to-run failed-to-run 7 519.lbm_r lbm_r_base.default ... failed-to-run failed-to-run -8 520.omnetpp_r omnetpp_r_base.default ... failed-to-run failed-to-run -9 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run +8 519.lbm_r lbm_r_base.default ... failed-to-run failed-to-run +9 520.omnetpp_r omnetpp_r_base.default ... failed-to-run failed-to-run 10 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run -11 525.x264_r x264_r_base.default ... failed-to-run failed-to-run -12 526.blender_r blender_r_base.default ... failed-to-run failed-to-run -13 531.deepsjeng_r deepsjeng_r_base.default ... -1 -1 -15 538.imagick_r imagick_r_base.default ... failed-to-run failed-to-run +11 523.xalancbmk_r cpuxalan_r_base.default ... failed-to-run failed-to-run +12 525.x264_r x264_r_base.default ... failed-to-run failed-to-run +13 526.blender_r blender_r_base.default ... failed-to-run failed-to-run +14 531.deepsjeng_r deepsjeng_r_base.default ... -1 success 16 538.imagick_r imagick_r_base.default ... failed-to-run failed-to-run 17 541.leela_r leela_r_base.default ... failed-to-run failed-to-run 18 541.leela_r leela_r_base.default ... failed-to-run failed-to-run 20 544.nab_r nab_r_base.default ... failed-to-run failed-to-run -21 557.xz_r xz_r_base.default ... -1 -1 +21 557.xz_r xz_r_base.default ... -1 success [19 rows x 20 columns] output-bmk-results.py(261): for index, row in results_df.iterrows(): @@ -751,7 +751,7 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.regression : 519.lbm_r,lbm_r_base.default : sample=0% (threshold=3%) +DEBUG: checking exe.regression : 523.xalancbmk_r,cpuxalan_r_base.default : sample=-1% (threshold=3%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_regression output-bmk-results.py(183): if metric in metric_utils.higher_regress_metrics: @@ -795,51 +795,7 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.regression : 523.xalancbmk_r,cpuxalan_r_base.default : sample=1% (threshold=3%) -output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): - --- modulename: output-bmk-results, funcname: is_entry_regression -output-bmk-results.py(183): if metric in metric_utils.higher_regress_metrics: -output-bmk-results.py(184): return (result - 100 > threshold) -output-bmk-results.py(233): continue -output-bmk-results.py(224): for index, row in out_df.iterrows(): -output-bmk-results.py(226): threshold = get_threshold(sym_type, metric, mode, row["benchmark"], row["symbol"]) - --- modulename: output-bmk-results, funcname: get_threshold -output-bmk-results.py(98): if metric == "sample": -output-bmk-results.py(99): spec_thr = get_specific_thresholds(metric, mode, bmk, symb) - --- modulename: output-bmk-results, funcname: get_specific_thresholds -output-bmk-results.py(57): if specific_variability is None: -output-bmk-results.py(60): var = specific_variability[ (specific_variability['benchmark'] == bmk) & (specific_variability['symbol'].str.strip() == symb)] -output-bmk-results.py(61): if var.empty: -output-bmk-results.py(62): return np.nan -output-bmk-results.py(100): if not np.isnan(spec_thr): -output-bmk-results.py(107): if metric == "num_vect_loops" or metric == "num_sve_loops": -output-bmk-results.py(110): return default_threshold[(change_kind,metric,mode)] -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.regression : 531.deepsjeng_r,deepsjeng_r_base.default : sample=1% (threshold=3%) -output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): - --- modulename: output-bmk-results, funcname: is_entry_regression -output-bmk-results.py(183): if metric in metric_utils.higher_regress_metrics: -output-bmk-results.py(184): return (result - 100 > threshold) -output-bmk-results.py(233): continue -output-bmk-results.py(224): for index, row in out_df.iterrows(): -output-bmk-results.py(226): threshold = get_threshold(sym_type, metric, mode, row["benchmark"], row["symbol"]) - --- modulename: output-bmk-results, funcname: get_threshold -output-bmk-results.py(98): if metric == "sample": -output-bmk-results.py(99): spec_thr = get_specific_thresholds(metric, mode, bmk, symb) - --- modulename: output-bmk-results, funcname: get_specific_thresholds -output-bmk-results.py(57): if specific_variability is None: -output-bmk-results.py(60): var = specific_variability[ (specific_variability['benchmark'] == bmk) & (specific_variability['symbol'].str.strip() == symb)] -output-bmk-results.py(61): if var.empty: -output-bmk-results.py(62): return np.nan -output-bmk-results.py(100): if not np.isnan(spec_thr): -output-bmk-results.py(107): if metric == "num_vect_loops" or metric == "num_sve_loops": -output-bmk-results.py(110): return default_threshold[(change_kind,metric,mode)] -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.regression : 538.imagick_r,imagick_r_base.default : sample=0% (threshold=3%) +DEBUG: checking exe.regression : 531.deepsjeng_r,deepsjeng_r_base.default : sample=0% (threshold=3%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_regression output-bmk-results.py(183): if metric in metric_utils.higher_regress_metrics: @@ -989,7 +945,7 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.improvement : 519.lbm_r,lbm_r_base.default : sample=0% (threshold=3%) +DEBUG: checking exe.improvement : 523.xalancbmk_r,cpuxalan_r_base.default : sample=-1% (threshold=3%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_improvement output-bmk-results.py(192): if metric in metric_utils.higher_regress_metrics: @@ -1033,51 +989,7 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.improvement : 523.xalancbmk_r,cpuxalan_r_base.default : sample=1% (threshold=3%) -output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): - --- modulename: output-bmk-results, funcname: is_entry_improvement -output-bmk-results.py(192): if metric in metric_utils.higher_regress_metrics: -output-bmk-results.py(193): return (100 - result > threshold) -output-bmk-results.py(233): continue -output-bmk-results.py(224): for index, row in out_df.iterrows(): -output-bmk-results.py(226): threshold = get_threshold(sym_type, metric, mode, row["benchmark"], row["symbol"]) - --- modulename: output-bmk-results, funcname: get_threshold -output-bmk-results.py(98): if metric == "sample": -output-bmk-results.py(99): spec_thr = get_specific_thresholds(metric, mode, bmk, symb) - --- modulename: output-bmk-results, funcname: get_specific_thresholds -output-bmk-results.py(57): if specific_variability is None: -output-bmk-results.py(60): var = specific_variability[ (specific_variability['benchmark'] == bmk) & (specific_variability['symbol'].str.strip() == symb)] -output-bmk-results.py(61): if var.empty: -output-bmk-results.py(62): return np.nan -output-bmk-results.py(100): if not np.isnan(spec_thr): -output-bmk-results.py(107): if metric == "num_vect_loops" or metric == "num_sve_loops": -output-bmk-results.py(110): return default_threshold[(change_kind,metric,mode)] -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.improvement : 531.deepsjeng_r,deepsjeng_r_base.default : sample=1% (threshold=3%) -output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): - --- modulename: output-bmk-results, funcname: is_entry_improvement -output-bmk-results.py(192): if metric in metric_utils.higher_regress_metrics: -output-bmk-results.py(193): return (100 - result > threshold) -output-bmk-results.py(233): continue -output-bmk-results.py(224): for index, row in out_df.iterrows(): -output-bmk-results.py(226): threshold = get_threshold(sym_type, metric, mode, row["benchmark"], row["symbol"]) - --- modulename: output-bmk-results, funcname: get_threshold -output-bmk-results.py(98): if metric == "sample": -output-bmk-results.py(99): spec_thr = get_specific_thresholds(metric, mode, bmk, symb) - --- modulename: output-bmk-results, funcname: get_specific_thresholds -output-bmk-results.py(57): if specific_variability is None: -output-bmk-results.py(60): var = specific_variability[ (specific_variability['benchmark'] == bmk) & (specific_variability['symbol'].str.strip() == symb)] -output-bmk-results.py(61): if var.empty: -output-bmk-results.py(62): return np.nan -output-bmk-results.py(100): if not np.isnan(spec_thr): -output-bmk-results.py(107): if metric == "num_vect_loops" or metric == "num_sve_loops": -output-bmk-results.py(110): return default_threshold[(change_kind,metric,mode)] -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) -output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking exe.improvement : 538.imagick_r,imagick_r_base.default : sample=0% (threshold=3%) +DEBUG: checking exe.improvement : 531.deepsjeng_r,deepsjeng_r_base.default : sample=0% (threshold=3%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_improvement output-bmk-results.py(192): if metric in metric_utils.higher_regress_metrics: @@ -1227,12 +1139,37 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking symbol.regression : 538.imagick_r,libc.so.6 : sample=0% (threshold=15%) +DEBUG: checking symbol.regression : 538.imagick_r,libc.so.6 : sample=-50% (threshold=15%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_regression output-bmk-results.py(183): if metric in metric_utils.higher_regress_metrics: output-bmk-results.py(184): return (result - 100 > threshold) -output-bmk-results.py(233): continue +output-bmk-results.py(235): percent_change, short_diag, long_diag = get_short_long_diag(row, metric, sym_type, change_kind) + --- modulename: output-bmk-results, funcname: get_short_long_diag +output-bmk-results.py(137): bmk = row["benchmark"] +output-bmk-results.py(139): rel_value = row["rel_" + metric] +output-bmk-results.py(140): prev_value = row[metric + "_x"] +output-bmk-results.py(141): curr_value = row[metric + "_y"] +output-bmk-results.py(142): if metric == "num_vect_loops" or metric == "num_sve_loops": +output-bmk-results.py(152): suffix = "" +output-bmk-results.py(153): if metric == "sample": +output-bmk-results.py(154): prefix_regression = "slowed down by" +output-bmk-results.py(155): prefix_improvement = "sped up by" +output-bmk-results.py(156): suffix = "perf samples" +output-bmk-results.py(167): if sym_type=="symbol": +output-bmk-results.py(168): item=bmk+":"+row["symbol"] +output-bmk-results.py(172): short_diag = "{1} {2}% - {0}".format(item, locals()["prefix_" + change_kind], abs(rel_value - 100)) +output-bmk-results.py(173): long_diag = "{0} - from {1} to {2} {3}".format(short_diag, prev_value, curr_value, suffix) +output-bmk-results.py(174): return abs(rel_value - 100), short_diag, long_diag +output-bmk-results.py(239): if metric == "sample" \ +output-bmk-results.py(240): and row['symbol_md5sum_x'] == row['symbol_md5sum_y'] \ +output-bmk-results.py(241): and row['symbol_md5sum_x'] != "-1" \ +output-bmk-results.py(242): and row['symbol_md5sum_x'] != "d41d8cd98f00b204e9800998ecf8427e": +output-bmk-results.py(243): f_skip.write_csv((row["benchmark"], row["symbol"], short_diag, long_diag)) + --- modulename: output-bmk-results, funcname: write_csv +output-bmk-results.py(41): if not self.predicate or not self.csvwriter: +output-bmk-results.py(43): self.csvwriter.writerow(arr) +output-bmk-results.py(244): continue output-bmk-results.py(224): for index, row in out_df.iterrows(): output-bmk-results.py(226): threshold = get_threshold(sym_type, metric, mode, row["benchmark"], row["symbol"]) --- modulename: output-bmk-results, funcname: get_threshold @@ -1311,7 +1248,7 @@ output-bmk-results.py(110): return default_threshold[(change_kind,metric,mod output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ output-bmk-results.py(229): .format(sym_type, change_kind, row["benchmark"], row["symbol"], metric, 100-row["rel_" + metric], threshold)) output-bmk-results.py(228): print("DEBUG: checking {0}.{1} : {2},{3} : {4}={5}% (threshold={6}%)"\ -DEBUG: checking symbol.improvement : 538.imagick_r,libc.so.6 : sample=0% (threshold=15%) +DEBUG: checking symbol.improvement : 538.imagick_r,libc.so.6 : sample=-50% (threshold=15%) output-bmk-results.py(232): if not is_entry_xxx[change_kind](metric, row["rel_" + metric], threshold): --- modulename: output-bmk-results, funcname: is_entry_improvement output-bmk-results.py(192): if metric in metric_utils.higher_regress_metrics: @@ -1355,7 +1292,6 @@ output-bmk-results.py(305): f_skip.close() output-bmk-results.py(29): if not self.outf: output-bmk-results.py(31): self.outf.close() output-bmk-results.py(32): if os.stat(self.filename).st_size == 0: -output-bmk-results.py(33): os.remove(self.filename) output-bmk-results.py(306): f_regr.close() --- modulename: output-bmk-results, funcname: close output-bmk-results.py(29): if not self.outf: |