From c41730e024965b18c437461e6c11b38848223682 Mon Sep 17 00:00:00 2001 From: Wenjing Margaret Mao Date: Tue, 16 Apr 2024 18:11:56 +0800 Subject: [PATCH] edit 'ppl_result does not exist' issue, delete useless code (#10767) * edit ppl_result not exist issue, delete useless code * delete nonzero_min function --------- Co-authored-by: jenniew --- .../benchmark/perplexity/ppl_csv_to_html.py | 26 ------------------- 1 file changed, 26 deletions(-) diff --git a/python/llm/test/benchmark/perplexity/ppl_csv_to_html.py b/python/llm/test/benchmark/perplexity/ppl_csv_to_html.py index cef18a85..bb665136 100644 --- a/python/llm/test/benchmark/perplexity/ppl_csv_to_html.py +++ b/python/llm/test/benchmark/perplexity/ppl_csv_to_html.py @@ -33,26 +33,9 @@ def highlight_vals(val, max=3.0, color1='red', color2='green', color3='yellow', else: return '' -def nonzero_min(lst): - non_zero_lst = [num for num in lst if num > 0.0] - return min(non_zero_lst) if non_zero_lst else None - def is_diffs_within_normal_range(diff_ppl_result, threshold=5.0): return not any(diff < (-threshold) for diff in diff_ppl_result if isinstance(diff, float)) -def add_to_dict(dict, key, value): - if key not in dict: - dict[key] = [] - dict[key].append(value) - -def best_in_dict(dict, key, value): - if key in dict: - best_value = nonzero_min(dict[key]) - if best_value < value or value <= 0.0: - return best_value - return value - return value - def create_fp16_dict(fp16_path): fp16_df = pd.read_csv(fp16_path) fp16_dict = {} @@ -118,15 +101,6 @@ def main(): diff_ppl_result=['']*len(latest_csv.index) ppl_result = 'ppl_result' - - csv_dict = {} - for csv_file in csv_files: - current_csv = pd.read_csv(csv_file, index_col=0) - for current_csv_ind,current_csv_row in current_csv.iterrows(): - current_csv_model=current_csv_row['Model'].strip() - current_csv_precision=current_csv_row['Precision'].strip() - current_csv_model_ppl_result=current_csv_model+'-'+current_csv_precision+'-'+'ppl_result' - add_to_dict(csv_dict, current_csv_model_ppl_result, current_csv_row[ppl_result]) for latest_csv_ind,latest_csv_row in latest_csv.iterrows():