magma/tuning/generate_tuning.py

#!/usr/bin/env python3

# Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
# Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
# All Rights reserved. See files LICENSE and NOTICE for details.
#
# This file is part of CEED, a collection of benchmarks, miniapps, software
# libraries and APIs for efficient high-order finite element and spectral
# element discretizations for exascale applications. For more information and
# source code availability see http://github.com/ceed
#
# The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
# a collaborative effort of two U.S. Department of Energy organizations (Office
# of Science and the National Nuclear Security Administration) responsible for
# the planning and preparation of a capable exascale ecosystem, including
# software, applications, hardware, advanced system engineering and early
# testbed platforms, in support of the nation's exascale computing imperative.
*26bdecf3SSebastian Grimberg
import argparse
import io
import os
import re
import shlex
import subprocess
import time

import pandas as pd
*26bdecf3SSebastian Grimberg
# Directory holding this script, with symlinks resolved; every path used by
# the tuning workflow is built relative to it.
script_dir = os.path.split(os.path.realpath(__file__))[0]
*26bdecf3SSebastian Grimberg
*26bdecf3SSebastian Grimberg
def build(nb, build_cmd):
    """Rebuild the library and the tuning executable for one value of NB.

    Rewrites the ``#define CEED_AUTOTUNE_RTC_NB`` line of
    ``ceed-magma-gemm-selector.cpp`` (one directory above this script) so that
    it carries ``nb``, then runs ``build_cmd`` three directories above this
    script and ``make tuning`` in this script's directory.

    Args:
        nb: Value written after ``#define CEED_AUTOTUNE_RTC_NB``.
        build_cmd: Build command, either a single string (split with
            shell-like quoting rules, so ``"make -j8"`` works) or an already
            split argument list.

    Raises:
        subprocess.CalledProcessError: If either build step exits non-zero.
    """
    selector_path = f"{script_dir}/../ceed-magma-gemm-selector.cpp"
    with open(selector_path, 'r') as f:
        data = f.read()
    # Replace the whole line containing the define with "<define> <nb>".
    data = re.sub(
        '.*(#define CEED_AUTOTUNE_RTC_NB).*',
        r'\1' + f" {nb}",
        data)
    with open(selector_path, 'w') as f:
        f.write(data)

    # Without shell=True a plain string is taken as the program name, so a
    # command carrying arguments has to be split into an argument list first.
    if isinstance(build_cmd, str):
        build_cmd = shlex.split(build_cmd)

    # check=True: a failed build must stop the run, otherwise the benchmarks
    # would be executed against a stale (or missing) executable.
    subprocess.run(build_cmd, cwd=f"{script_dir}/../../..", check=True)
    subprocess.run(["make", "tuning"], cwd=f"{script_dir}", check=True)
*26bdecf3SSebastian Grimberg
*26bdecf3SSebastian Grimberg
def benchmark(backend):
    """Run the tuning executable for one backend and parse what it prints.

    Args:
        backend: Ceed resource specifier, passed as the only argument to
            ``./tuning``.

    Returns:
        pandas.DataFrame with the columns ``P``, ``N``, ``Q``, ``Q_COMP``,
        ``TRANS`` and ``MFLOPS``, one row per whitespace-separated record read
        from the executable's standard output.
    """
    # Run from the script directory, where build() invokes `make tuning`, so
    # the relative ./tuning path does not depend on the caller's working
    # directory. NOTE(review): assumes the Makefile places `tuning` there.
    result = subprocess.run(
        ["./tuning", f"{backend}"],
        capture_output=True,
        cwd=script_dir)
    # sep=r'\s+' is the documented replacement for the deprecated
    # delim_whitespace=True.
    return pd.read_csv(
        io.StringIO(result.stdout.decode('utf-8')),
        header=None,
        sep=r'\s+',
        names=['P', 'N', 'Q', 'Q_COMP', 'TRANS', 'MFLOPS'])
*26bdecf3SSebastian Grimberg
_BANNER = "////////////////////////////////////////////////////////////////////////////////\n"


def _format_rows(table):
    """Return one comma-separated ``P, N, Q, Q_COMP, NB`` string per row."""
    if table.empty:
        # to_string() renders an "Empty DataFrame ..." banner for an empty
        # frame; that text must never end up inside the generated header.
        return []
    text = table.to_string(
        header=False,
        index=False,
        columns=['P', 'N', 'Q', 'Q_COMP', 'NB'])
    # Put a comma only before whitespace that follows a value. Leading padding
    # of right-justified rows is left alone, so no record starts with ",".
    return [re.sub(r'(?<=\S)(\s+)', r',\1', row.rstrip())
            for row in text.split('\n')]


def _write_table(f, name, rows):
    """Write one ``std::vector`` initializer called ``name`` holding ``rows``."""
    f.write(_BANNER)
    f.write(
        f"std::vector<std::array<int, RECORD_LENGTH_RTC> > {name}" +
        " = {\n")
    # Every record but the last is followed by a comma.
    f.write(",\n".join("    {" + row + "}" for row in rows))
    if rows:
        f.write("\n")
    f.write("};\n")


if __name__ == "__main__":
    # Command line arguments
    parser = argparse.ArgumentParser("MAGMA RTC autotuning")
    parser.add_argument(
        "-arch",
        help="Device architecture name for tuning data",
        required=True)
    parser.add_argument(
        "-max-nb",
        help="Maximum block size NB to consider for autotuning",
        default=32,
        type=int)
    parser.add_argument(
        "-ceed",
        help="Ceed resource specifier",
        default="/cpu/self")
    parser.add_argument(
        "-build-cmd",
        help="Command used to build libCEED from the source root directory",
        default="make")
    args = parser.parse_args()
    if args.max_nb < 1:
        # With no NB value to try there would be no data to write below.
        parser.error("-max-nb must be at least 1")

    # Best result seen so far for every benchmarked configuration.
    data = None
    for nb in range(1, args.max_nb + 1):
        # Rebuild the code for the given value of NB
        build(nb, args.build_cmd)

        # Run the benchmarks
        start = time.perf_counter()
        data_nb = benchmark(args.ceed)
        print(
            f"Finished benchmarks for NB = {nb}, backend = {args.ceed} ({time.perf_counter() - start} s)")

        # Save the data for the highest performing NB
        if data is None:
            data = data_nb.copy()
            data['NB'] = nb
        else:
            # Rows where this NB beats the best MFLOPS recorded so far.
            idx = data_nb['MFLOPS'] > data['MFLOPS']
            data.loc[idx, 'NB'] = nb
            data.loc[idx, 'MFLOPS'] = data_nb.loc[idx, 'MFLOPS']

    # Print the results
    with open(f"{script_dir}/{args.arch}_rtc.h", 'w') as f:
        f.write(_BANNER)
        f.write(f"// auto-generated from data on {args.arch}\n\n")

        # Rows with TRANS == 1 go to drtc_t_<arch>, rows with TRANS == 0 to
        # drtc_n_<arch>; a blank line separates the two tables.
        _write_table(f, f"drtc_t_{args.arch}",
                     _format_rows(data.loc[data['TRANS'] == 1]))
        f.write("\n")
        _write_table(f, f"drtc_n_{args.arch}",
                     _format_rows(data.loc[data['TRANS'] == 0]))