src/madengine/tools/update_perf_csv.py (15 additions, 7 deletions)
@@ -116,21 +116,29 @@ def handle_multiple_results(
         row = common_info_json.copy()
         model = r.pop("model")
         row["model"] = model_name + "_" + str(model)
-        row.update(r)
+
+        # Extract all columns from CSV result to ensure proper column alignment
+        # This ensures all result columns (benchmark, tp, inp, out, dtype, etc.) are captured
+        for key, value in r.items():
+            row[key] = value
 
-        if row["performance"] is not None and pd.notna(row["performance"]):
+        if row.get("performance") is not None and pd.notna(row.get("performance")):
             row["status"] = "SUCCESS"
         else:
             row["status"] = "FAILURE"
 
         final_multiple_results_df = pd.concat(
             [final_multiple_results_df, pd.DataFrame(row, index=[0])], ignore_index=True
         )
-        # Reorder columns according to existing perf csv
-        columns = perf_csv_df.columns.tolist()
-        # Add any additional columns to the end
-        columns = columns + [col for col in final_multiple_results_df.columns if col not in columns]
-        final_multiple_results_df = final_multiple_results_df[columns]
+
+    # Reorder columns according to existing perf csv (moved outside loop for efficiency)
+    if not final_multiple_results_df.empty:
+        desired_columns = perf_csv_df.columns.tolist()
+        # Add any additional columns from final_multiple_results_df
+        desired_columns = desired_columns + [col for col in final_multiple_results_df.columns if col not in desired_columns]
+        # Only select columns that actually exist in final_multiple_results_df to avoid KeyError
+        available_columns = [col for col in desired_columns if col in final_multiple_results_df.columns]
+        final_multiple_results_df = final_multiple_results_df[available_columns]
 
     perf_entry_df_to_csv(final_multiple_results_df)
     if perf_csv_df.empty:
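A minimal, self-contained sketch of the column-reordering logic added above (the DataFrame contents and column names here are illustrative, not taken from the PR):

import pandas as pd

# Simulate an existing perf CSV schema and one accumulated result row.
perf_csv_df = pd.DataFrame(columns=["model", "performance", "metric"])
final_multiple_results_df = pd.DataFrame(
    [{"model": "demo_7b", "performance": 1523.4, "metric": "tokens/sec", "tp": 8}]
)

# Existing perf-csv columns first, then any extra result columns; keep only
# columns actually present in the frame to avoid a KeyError on selection.
desired = perf_csv_df.columns.tolist()
desired += [c for c in final_multiple_results_df.columns if c not in desired]
available = [c for c in desired if c in final_multiple_results_df.columns]
final_multiple_results_df = final_multiple_results_df[available]
print(final_multiple_results_df.columns.tolist())
# ['model', 'performance', 'metric', 'tp']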
src/madengine/tools/update_perf_super.py (new file, 327 additions)
@@ -0,0 +1,327 @@
"""Module to update the perf_entry_super.json file with enhanced performance data.

This module is used to update the perf_entry_super.json file with performance data
that includes configuration information from config files.

Copyright (c) Advanced Micro Devices, Inc. All rights reserved.
"""

# built-in imports
import json
import os
import typing
# third-party imports
import pandas as pd
# MAD Engine imports
from madengine.utils.config_parser import ConfigParser


def read_json(js: str) -> dict:
"""Read a JSON file.

Args:
js: The path to the JSON file.

Returns:
The JSON dictionary.
"""
with open(js, 'r') as f:
return json.load(f)


def write_json(data: typing.Union[dict, list], output_path: str) -> None:
"""Write data to a JSON file.

Args:
data: The data to write (dict or list).
output_path: The path to the output JSON file.
"""
with open(output_path, 'w') as f:
json.dump(data, f, indent=2)


def load_perf_super_json(perf_super_json: str) -> list:
"""Load existing perf_entry_super.json file.

Args:
perf_super_json: Path to perf_entry_super.json file.

Returns:
List of performance records, or empty list if file doesn't exist.
"""
if not os.path.exists(perf_super_json):
return []

try:
data = read_json(perf_super_json)
# Ensure it's a list
if isinstance(data, list):
return data
else:
return [data]
except Exception as e:
print(f"Warning: Could not load existing perf_entry_super.json: {e}")
return []
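
# Example usage (an illustrative sketch, not part of the module): a file that
# holds a single JSON object is normalized to a one-element list, and a
# missing file yields an empty list.
#
#   write_json({"model": "demo", "status": "SUCCESS"}, "perf_entry_super.json")
#   load_perf_super_json("perf_entry_super.json")  # -> [{"model": "demo", ...}]
#   load_perf_super_json("missing.json")           # -> []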


def handle_multiple_results_super(
perf_super_list: list,
multiple_results: str,
common_info: str,
model_name: str,
config_parser: ConfigParser
) -> list:
"""Handle multiple results with config matching.

Args:
perf_super_list: List of existing performance records.
multiple_results: The path to the multiple results CSV file.
common_info: The path to the common info JSON file.
model_name: The model name.
config_parser: ConfigParser instance for loading configs.

Returns:
Updated list of performance records with configs.
"""
# Load multiple results CSV
multiple_results_df = pd.read_csv(multiple_results)
multiple_results_df.columns = multiple_results_df.columns.str.strip()

# Check required columns
required_cols = ['model', 'performance', 'metric']
for col in required_cols:
if col not in multiple_results_df.columns:
raise RuntimeError(f"{multiple_results} file is missing the {col} column")

# Load common info
common_info_json = read_json(common_info)

# Parse config file from args if present
configs_data = None
if 'args' in common_info_json and common_info_json['args']:
# Try to extract config path from args
scripts_path = common_info_json.get('pipeline', '')
configs_data = config_parser.parse_and_load(
common_info_json['args'],
scripts_path
)

# Process each result row
for result_row in multiple_results_df.to_dict(orient="records"):
record = common_info_json.copy()

# Update model name
result_model = result_row.pop("model")
record["model"] = f"{model_name}_{result_model}"

# Extract metadata fields that should be at top level
record["performance"] = result_row.get("performance")
record["metric"] = result_row.get("metric")

# Set status based on performance
if record.get("performance") is not None and pd.notna(record.get("performance")):
record["status"] = "SUCCESS"
else:
record["status"] = "FAILURE"

# Store all result data in multi_results field (structured data)
# This captures additional metrics beyond the primary performance metric
record["multi_results"] = result_row

# Match config to this specific result
if configs_data:
if isinstance(configs_data, list):
# For CSV configs with multiple rows, try to match
matched_config = config_parser.match_config_to_result(
configs_data,
result_row,
result_model
)
record["configs"] = matched_config
else:
# For JSON/YAML configs, use as-is
record["configs"] = configs_data
else:
record["configs"] = None

perf_super_list.append(record)

return perf_super_list
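
# Usage sketch (file names, CSV columns, and args below are assumptions for
# illustration, not defined by this module): given a results CSV such as
#
#   model,performance,metric,tp,dtype
#   7b,1523.4,tokens/sec,1,fp16
#
# and a common-info JSON like {"args": "--config cfg.csv", "pipeline": "scripts/"},
# each CSV row becomes one record with top-level performance/metric/status, the
# full row stored under "multi_results", and a matched config under "configs":
#
#   records = handle_multiple_results_super(
#       [], "multi_results.csv", "common_info.json", "llama2",
#       ConfigParser(scripts_base_dir="scripts"),
#   )
#   records[0]["model"]   # -> "llama2_7b"
#   records[0]["status"]  # -> "SUCCESS"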


def handle_single_result_super(
perf_super_list: list,
single_result: str
) -> list:
"""Handle a single result.

Args:
perf_super_list: List of existing performance records.
single_result: The path to the single result JSON file.

Returns:
Updated list of performance records.
"""
single_result_json = read_json(single_result)

# Ensure configs field exists (may be None)
if "configs" not in single_result_json:
single_result_json["configs"] = None

perf_super_list.append(single_result_json)
return perf_super_list


def handle_exception_result_super(
perf_super_list: list,
exception_result: str
) -> list:
"""Handle an exception result.

Args:
perf_super_list: List of existing performance records.
exception_result: The path to the exception result JSON file.

Returns:
Updated list of performance records.
"""
exception_result_json = read_json(exception_result)

# Ensure configs field exists (may be None)
if "configs" not in exception_result_json:
exception_result_json["configs"] = None

perf_super_list.append(exception_result_json)
return perf_super_list
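
# Note (illustrative): both single-result and exception-result records are
# appended as-is; the only normalization is guaranteeing a "configs" key.
#
#   handle_single_result_super([], "single_result.json")
#   # -> [{...original record..., "configs": None}]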


def update_perf_super_json(
perf_super_json: str,
multiple_results: typing.Optional[str] = None,
single_result: typing.Optional[str] = None,
exception_result: typing.Optional[str] = None,
common_info: typing.Optional[str] = None,
model_name: typing.Optional[str] = None,
scripts_base_dir: typing.Optional[str] = None,
cumulative_json: typing.Optional[str] = None,
) -> None:
"""Update the perf_entry_super.json file with the latest performance data.

Args:
perf_super_json: Path to perf_entry_super.json file (latest run only).
multiple_results: Path to multiple results CSV file.
single_result: Path to single result JSON file.
exception_result: Path to exception result JSON file.
common_info: Path to common info JSON file.
model_name: The model name.
scripts_base_dir: Base directory for scripts (for config file resolution).
cumulative_json: Path to cumulative perf_super.json file (all runs). If provided,
results will be appended to this file in addition to perf_entry_super.json.
"""
print(f"Updating perf_entry_super.json with enhanced performance data")

# Start with empty list for latest run
perf_super_list = []

# Create config parser
config_parser = ConfigParser(scripts_base_dir=scripts_base_dir)

# Handle different result types
if multiple_results:
perf_super_list = handle_multiple_results_super(
perf_super_list,
multiple_results,
common_info,
model_name,
config_parser,
)
elif single_result:
perf_super_list = handle_single_result_super(perf_super_list, single_result)
elif exception_result:
perf_super_list = handle_exception_result_super(
perf_super_list, exception_result
)
else:
print("No results to update in perf_entry_super.json")
return

# Write latest run to perf_entry_super.json
write_json(perf_super_list, perf_super_json)
print(f"Successfully updated {perf_super_json} (latest run)")

# Export latest run to CSV
export_perf_super_to_csv(perf_super_json)

# Update cumulative database if path provided
if cumulative_json:
cumulative_list = load_perf_super_json(cumulative_json)
cumulative_list.extend(perf_super_list)
write_json(cumulative_list, cumulative_json)
print(f"Successfully updated {cumulative_json} (cumulative - {len(cumulative_list)} total entries)")
export_perf_super_to_csv(cumulative_json)
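
# Usage sketch (paths below are illustrative): write the latest run to
# perf_entry_super.json and append the same records to a cumulative file.
#
#   update_perf_super_json(
#       "perf_entry_super.json",
#       multiple_results="multi_results.csv",
#       common_info="common_info.json",
#       model_name="llama2",
#       scripts_base_dir="scripts",
#       cumulative_json="perf_super.json",
#   )
#
# Both JSON files are also mirrored to CSV via export_perf_super_to_csv.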


def export_perf_super_to_csv(perf_super_json: str) -> None:
"""Export perf_entry_super.json to CSV format.

Flattens nested structures (multi_results, configs) and exports to CSV.

Args:
perf_super_json: Path to perf_entry_super.json file.
"""
if not os.path.exists(perf_super_json):
print(f"Warning: {perf_super_json} does not exist. Skipping CSV export.")
return

try:
data = read_json(perf_super_json)

# Handle both single dict and list
if isinstance(data, dict):
data = [data]
elif not isinstance(data, list):
print(f"Warning: Unexpected data type in {perf_super_json}")
return

if len(data) == 0:
print(f"Warning: No data in {perf_super_json}")
return

# Flatten nested structures for CSV
flattened_data = []
for record in data:
flat_record = {}

for key, value in record.items():
if key == 'multi_results' and isinstance(value, dict):
# Expand multi_results to top level with prefix
for mr_key, mr_value in value.items():
flat_record[f"mr_{mr_key}"] = mr_value
elif key == 'configs' and value is not None:
# Convert configs to JSON string
flat_record['configs'] = json.dumps(value)
elif isinstance(value, (list, dict)):
# Convert other complex types to JSON strings
flat_record[key] = json.dumps(value) if value else None
else:
flat_record[key] = value

flattened_data.append(flat_record)

# Create DataFrame and export
df = pd.DataFrame(flattened_data)

# Reorder columns: put important ones first
priority_cols = ['model', 'status', 'performance', 'metric']
other_cols = [col for col in df.columns if col not in priority_cols]
ordered_cols = [col for col in priority_cols if col in df.columns] + other_cols
df = df[ordered_cols]

# Export to CSV
csv_filename = perf_super_json.replace('.json', '.csv')
df.to_csv(csv_filename, index=False)
print(f"Successfully exported {csv_filename}")

except Exception as e:
print(f"Error exporting {perf_super_json} to CSV: {e}")
