diff --git a/python/llm/dev/benchmark/all-in-one/run.py b/python/llm/dev/benchmark/all-in-one/run.py
index bcae312b..bc267208 100644
--- a/python/llm/dev/benchmark/all-in-one/run.py
+++ b/python/llm/dev/benchmark/all-in-one/run.py
@@ -401,6 +401,7 @@ def run_transformer_int4_gpu(repo_id,
                         result[in_out].append([model.first_cost, model.rest_cost_mean, model.encoder_time,
                                             actual_in_len, actual_out_len])
             except RuntimeError:
+                traceback.print_exc()
                 pass
     del model
     torch.xpu.empty_cache()
diff --git a/python/llm/test/benchmark/csv_to_html.py b/python/llm/test/benchmark/csv_to_html.py
index a4bd58d9..94969c5c 100644
--- a/python/llm/test/benchmark/csv_to_html.py
+++ b/python/llm/test/benchmark/csv_to_html.py
@@ -21,6 +21,12 @@ import sys
 import argparse
 import pandas as pd
 
+def highlight_vals(val, max=-3.0, color='yellow'):
+    if val < max:
+        return 'background-color: %s' % color
+    else:
+        return ''
+
 def main():
     parser = argparse.ArgumentParser(description="convert .csv file to .html file")
     parser.add_argument("-f", "--folder_path", type=str, dest="folder_path",
@@ -74,7 +80,14 @@ def main():
         latest_csv.insert(loc=6,column='diff2(%)',value=diff2)
 
     daily_html=csv_files[0].split(".")[0]+".html"
-    latest_csv.to_html(daily_html)
+
+    subset=['diff1(%)','diff2(%)']
+    columns={'1st token avg latency (ms)': '{:.2f}', '2+ avg latency (ms/token)': '{:.2f}', 'last1': '{:.2f}', 'diff1(%)': '{:.2f}',
+             'last2': '{:.2f}', 'diff2(%)': '{:.2f}', 'encoder time (ms)': '{:.2f}'}
+
+    with open(daily_html, 'w') as f:
+        f.write(latest_csv.style.format(columns).applymap(highlight_vals, subset)
+                        .set_table_attributes("border=1").render())
 
 if __name__ == "__main__":
     sys.exit(main())
\ No newline at end of file