diff --git a/python/llm/dev/benchmark/perplexity/make_csv.py b/python/llm/dev/benchmark/perplexity/make_csv.py index 0876bec7..426e8d53 100644 --- a/python/llm/dev/benchmark/perplexity/make_csv.py +++ b/python/llm/dev/benchmark/perplexity/make_csv.py @@ -35,9 +35,8 @@ def make_csv(result_dict, output_path=None): current_date = datetime.datetime.now().strftime("%Y-%m-%d") file_name = f'results_{current_date}.csv' full_path = os.path.join(output_path, file_name) if output_path else file_name - print('Writing to', full_path) file_name = full_path - headers = ["Index", "Model", "Precision", "en", "zh"] + headers = ["Index", "Model", "Precision", "ppl_result"] with open(file_name, mode='w', newline='') as csv_file: writer = csv.writer(csv_file) @@ -46,10 +45,10 @@ def make_csv(result_dict, output_path=None): for model, model_results in result_dict.items(): for precision, prec_results in model_results.items(): row = [index, model, precision] - for language in headers[3:]: + for language in ["en","zh"]: task_results = prec_results.get(language.lower(), None) if task_results is None: - row.append("") + continue else: result = task_results["results"] row.append("%.4f" % result) @@ -89,6 +88,7 @@ def main(*args): output_path = args[2] merged_results = merge_results(input_path) + make_csv(merged_results, output_path) diff --git a/python/llm/dev/benchmark/perplexity/make_table.py b/python/llm/dev/benchmark/perplexity/make_table.py index 18906b5a..e502b5ce 100644 --- a/python/llm/dev/benchmark/perplexity/make_table.py +++ b/python/llm/dev/benchmark/perplexity/make_table.py @@ -35,8 +35,8 @@ def make_table(result_dict): """Generate table of results.""" md_writer = MarkdownTableWriter() latex_writer = LatexTableWriter() - md_writer.headers = ["Model", "Precision", "en", "zh"] - latex_writer.headers = ["Model", "Precision", "en", "zh"] + md_writer.headers = ["Model", "Precision", "ppl_result"]#["Model", "Precision", "en", "zh"] + latex_writer.headers = ["Model", "Precision", "ppl_result"]#"en", "zh"] languages = ["en", "zh"] values = [] @@ -46,7 +46,7 @@ def make_table(result_dict): for language in languages: task_results = prec_results.get(language, None) if task_results is None: - value.append("") + continue#value.append("") else: result = task_results["results"] value.append("%.4f" % result)