# Invocation command line:
# /home/cpu2017/bin/harness/runcpu --configfile amd_speed_aocc400_znver4_A1.cfg --tune all --reportable --iterations 3 --nopower --runmode speed --tune base:peak --size test:train:refspeed fpspeed
# output_root was not used for this run
############################################################################
################################################################################
# AMD AOCC 400 SPEC CPU 2017 V1.1.9 Speed Configuration File for 64-bit Linux
#
#      File name                : amd_speed_aocc400_znver4_A1.cfg
#      Creation Date            : April 16, 2023
#      CPU 2017 Version         : 1.1.9
#      Supported benchmarks     : All Speed benchmarks (intspeed, fpspeed)
#      Compiler name/version    : AOCC 4.0.0
#      Operating system version : RHEL 8.6
#      Supported OS's           : Ubuntu 22.04, RHEL 8.6/9, SLE 15 SP4
#      Hardware                 : AMD znver4 (AMD64)
#      FP Base Pointer Size     : 64-bit
#      FP Peak Pointer Size     : 64-bit
#      INT Base Pointer Size    : 64-bit
#      INT Peak Pointer Size    : 64-bit
#      Auto Parallelization     : No
#
# Note: DO NOT EDIT THIS FILE, the only edits required to properly run these
# binaries are made in the ini Python file.  Please consult Readme.amd_speed_aocc400_znver4_A1.txt
# for a few uncommon exceptions which require edits to this file.
#
# Description:
#
# This binary package automates away many of the complexities necessary to set
# up and run SPEC CPU 2017 under optimized conditions on AMD znver4-based
# server platforms within Linux (AMD64).
#
# The binary package was built specifically for AMD znver4 microprocessors and
# is not intended to run on other products.
#
# Please install the binary package by following the instructions in
# "Readme.amd_speed_aocc400_znver4_A1.txt" under the "How To Use the Binaries" section.
#
# The binary package is designed to work without alteration on one socket AMD
# znver4-based servers with 96 cores, SMT enabled and 768 (64x12) GB of DDR5
# memory distributed evenly among all 12 channels using 64 GiB DIMMs.
#
# To run the binary package on other znver4 configurations, please review
# "Readme.amd_speed_aocc400_znver4_A1.txt". In general, znver4 CPUs
# should be autodetected with no action required by the user.
#
# In most cases, it should be unnecessary to edit "amd_speed_aocc400_znver4_A1.cfg" or any
# other file besides "ini_amd_speed_aocc400_znver4_A1.py" where reporting fields
# and run conditions are set.
#
# The run script automatically sets the optimal number of speed copies and binds
# them appropriately.
#
# The run script and accompanying binary package are designed to work on Ubuntu
# 22.04, RHEL 8.6/9, and SLE 15 SP4.
#
# Important! If you write your own run script, please set the stack size to
# "unlimited" when executing this binary package.  Failure to do so may cause
# some benchmarks to overflow the stack.  For example, to set stack size within
# the bash shell, include the following line somewhere at the top of your run
# script before the runcpu invocation:
#
#      ulimit -s unlimited
#
# Modification of this config file should only be necessary if you intend to
# rebuild the binaries.  General instructions for rebuilding the binaries are
# found in-line below.
#
################################################################################
# Modifiable macros:
################################################################################
# "allow_build" switch:
# Change the following line to true if you intend to REBUILD the binaries (AMD
# does not support this). Valid values are "true" or "false" (no quotes).
# Build gate tested by the %if/%elif/%else block further down: "false" selects
# the run-only settings (fail_build = 1), "true" selects the rebuild settings
# (fail_build = 0 plus makeflags), and any other value stops with a %error.
%define allow_build false
# Only change these macros if you are rebuilding the binary package:
%define compiler_name aocc400
# Expands to amd_speed_aocc400_znver4_A:
%define binary_package_name amd_speed_%{compiler_name}_znver4_A
# Reused below as the value of "ext", which in turn is assigned to "label":
%define binary_package_ext %{binary_package_name}
%define binary_package_revision 1
%define build_path ${SPEC}
# Expands to aocc400-flags.xml:
%define flags_file_name  %{compiler_name}-flags.xml
# Do NOT change build_lib_dir after the build or it will trigger a
# rebuild of xalancbmk. It should also remain literal (no macro references):
%define build_lib_dir amd_speed_aocc400_znver4_A_lib
# To enable the platform file, be sure to uncomment the "#flagsurl02" line
# in the Header settings section below.
%define platform_file_name INVALID_platform_%{binary_package_name}.xml
################################################################################
# You should never have to change binary_package_full_name. It is the package
# name immediately followed by the revision, i.e. amd_speed_aocc400_znver4_A1:
%define binary_package_full_name %{binary_package_name}%{binary_package_revision}

################################################################################
# Include file name
################################################################################
# The include file contains fields that are commonly changed. This file is auto-
# generated based upon INI file settings and should not need user modification
# for runs.

# Expands to amd_speed_aocc400_znver4_A1.inc (run-time fields, thread counts):
%define inc_file_name %{binary_package_full_name}.inc
# Expands to amd_speed_aocc400_znver4_A1_flags.inc (compilers and flags):
%define flags_inc_file_name %{binary_package_full_name}_flags.inc

# Binary label extension:
# Only modify the binary label extension if you plan to rebuild the binaries.
# If you plan to recompile these CPU 2017 binaries, please choose a new extension
# name below to avoid confusion with the current binary set on your system
# under test, and to avoid confusion for SPEC submission reviewers.  You will
# also need to set "allow_build" to true above. Finally, you must modify the
# Paths section below to point to your library locations if the paths are not
# already set up in your build environment.
# Note that AMD calls an external script to set up the compiler and library
# paths before initiating the build.

# "ext" is what the Header settings section assigns to "label":
%define ext %{binary_package_ext}

################################################################################
# Paths and Environment Variables
# ** MODIFY AS NEEDED (modification should not be necessary for runs) **
################################################################################
# Allow environment variables to be set before runs:
# Turn on handling of the preENV_* settings that follow:
preenv                   = 1

# Memory allocator options passed through the MALLOC_CONF environment variable.
# retain:true is necessary to avoid gcc out-of-memory exceptions on certain SUTs:
# oversize_threshold is required to support jemalloc 5.2.x+
preENV_MALLOC_CONF = oversize_threshold:0,retain:true
# NOTE(review): presumably turns off the LLVM OpenMP runtime's hidden helper
# threads - confirm against the libomp documentation.
preENV_LIBOMP_NUM_HIDDEN_HELPER_THREADS = 0

# OpenMP environment variables:
preENV_OMP_SCHEDULE      = static
preENV_OMP_DYNAMIC       = false
preENV_OMP_STACKSIZE     = 128M

# Define the name of the directory that holds AMD library files
# (expands to amd_speed_aocc400_znver4_A_lib, the same name as build_lib_dir):
%define lib_dir %{binary_package_name}_lib


# Set the shared object library path for runs and builds. The package library
# directory is placed in front of whatever LD_LIBRARY_PATH the caller already has:
preENV_LD_LIBRARY_PATH   = $[top]/%{lib_dir}/lib:%{ENV_LD_LIBRARY_PATH}
%if '%{allow_build}' eq 'false'
  # The include file is only needed for runs, but not for builds.
#  include: %{inc_file_name}
#  ----- Begin inclusion of 'amd_speed_aocc400_znver4_A1.inc'
############################################################################
################################################################################
################################################################################
# File name: amd_speed_aocc400_znver4_A1.inc
# File generation code date: October 11, 2022
# File generation date/time: July 12, 2024 / 07:03:53
#
# This file is automatically generated during a SPEC CPU2017 run.
#
# To modify inc file generation, please consult the readme file or the run
# script.
################################################################################
################################################################################

################################################################################
################################################################################
# The following macros are generated for use in the cfg file.
################################################################################
################################################################################

# Generated core counts for the system under test. Logical and physical counts
# are equal here, which matches hw_nthreadspercore = 1 in the report fields.
%define logical_core_count 64
%define physical_core_count 64

# Highest zero-based physical core index (physical_core_count - 1):
%define physical_core_max 63

# Highest zero-based logical core index (logical_core_count - 1):
%define logical_core_max 63

################################################################################
################################################################################
# The following inc blocks set the speed thread counts and affinity settings.
#
# intspeed benchmarks: 600.perlbench_s,602.gcc_s,605.mcf_s,620.omnetpp_s,
#   623.xalancbmk_s,625.x264_s,631.deepsjeng_s,641.leela_s,648.exchange2_s,
#   657.xz_s
# fpspeed benchmarks: 603.bwaves_s,607.cactuBSSN_s,619.lbm_s,621.wrf_s,
#   627.cam4_s,628.pop2_s,638.imagick_s,644.nab_s,649.fotonik3d_s,
#   654.roms_s
#
# Selected thread counts from '9354' section of CPU info
################################################################################
# default preENV thread settings:
# Applies to every benchmark unless a more specific section overrides it:
default:
preENV_OMP_THREAD_LIMIT  = 64
preENV_GOMP_CPU_AFFINITY = 0-63
################################################################################
################################################################################
# intspeed base thread counts:
# All 64 cores are used; the affinity list and the numactl binding both name
# CPUs 0-63. "submit" writes the benchmark command to run.sh and runs that
# script under $BIND.
intspeed=base:
threads                  = 64
ENV_GOMP_CPU_AFFINITY    = 0-63
bind0                    = numactl --physcpubind=0-63
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################
################################################################################
# fpspeed base thread counts:
# Same settings as intspeed base: 64 threads on CPUs 0-63.
fpspeed=base:
threads                  = 64
ENV_GOMP_CPU_AFFINITY    = 0-63
bind0                    = numactl --physcpubind=0-63
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################
################################################################################
# peak thread counts: 1
# Single-threaded peak group: every intspeed benchmark except 657.xz_s, each
# pinned to CPU 15 both through the affinity variable and through numactl.
600.perlbench_s,602.gcc_s,605.mcf_s,620.omnetpp_s,623.xalancbmk_s,625.x264_s,631.deepsjeng_s,641.leela_s,648.exchange2_s=peak:
threads                  = 1
ENV_GOMP_CPU_AFFINITY    = 15
bind0                    = numactl --physcpubind=15
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################
################################################################################
# peak thread counts: 64
# Sequential affinity list (0-63) across all cores.
603.bwaves_s,619.lbm_s,621.wrf_s,628.pop2_s,649.fotonik3d_s=peak:
threads                  = 64
ENV_GOMP_CPU_AFFINITY    = 0-63
bind0                    = numactl --physcpubind=0-63
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################
################################################################################
# peak thread counts: 64
# Same values as the previous group; 657.xz_s is the one intspeed benchmark here.
607.cactuBSSN_s,627.cam4_s,638.imagick_s,644.nab_s,657.xz_s=peak:
threads                  = 64
ENV_GOMP_CPU_AFFINITY    = 0-63
bind0                    = numactl --physcpubind=0-63
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################
################################################################################
# peak thread counts: 64
# 654.roms_s uses an interleaved affinity order (0 32 1 33 ... 31 63) instead of
# the sequential 0-63 list; the numactl binding still covers CPUs 0-63.
# NOTE(review): presumably alternates threads between the two chips - confirm
# against the CPU numbering of the system under test.
654.roms_s=peak:
threads                  = 64
ENV_GOMP_CPU_AFFINITY    = 0 32 1 33 2 34 3 35 4 36 5 37 6 38 7 39 8 40 9 41 10 42 11 43 12 44 13 45 14 46 15 47 16 48 17 49 18 50 19 51 20 52 21 53 22 54 23 55 24 56 25 57 26 58 27 59 28 60 29 61 30 62 31 63
bind0                    = numactl --physcpubind=0-63
submit = echo "$command" > run.sh ; $BIND bash run.sh
################################################################################

################################################################################
################################################################################
# Switch back to default so the report fields below are not attached to the
# 654.roms_s=peak section:
default:
################################################################################


################################################################################
################################################################################
# The remainder of this file defines CPU2017 report parameters.
################################################################################
################################################################################
################################################################################
# SPEC CPU 2017 report header
################################################################################
# Identification fields printed at the top of the report. The hw_model text is
# split across the numbered fields hw_model000 and hw_model001.
license_num              =9019
tester                   =Cisco Systems
test_sponsor             =Cisco Systems
hw_vendor                =Cisco Systems
hw_model000              =Cisco UCS C245 M8 (AMD EPYC 9354 32-Core
hw_model001              =Processor)
#--------- If you install new compilers, edit this section --------------------
sw_compiler              =C/C++/Fortran: Version 4.0.0 of AOCC
################################################################################

################################################################################
# Hardware, firmware and software information
################################################################################
hw_avail                 =Jun-2024
sw_avail                 =Jun-2023
hw_cpu_name              =AMD EPYC 9354
hw_cpu_nominal_mhz       =3250
hw_cpu_max_mhz           =3800
# 64 cores in total: hw_nchips (set further down) is 2 and the model string
# above names a 32-core processor. One thread per core agrees with the
# generated logical/physical core-count macros, which are both 64.
hw_ncores                =64
hw_nthreadspercore       =1
hw_ncpuorder             =1,2 chips

hw_other                 =CPU Cooling: Air
fw_bios                  =Version 4.3.4a released May-2024
sw_base_ptrsize          =64-bit
hw_pcache                =32 KB I + 32 KB D on chip per core
hw_scache                =1 MB I+D on chip per core
# The third-level cache text continues from hw_tcache000 into hw_tcache001:
hw_tcache000             =256 MB I+D on chip per chip, 32 MB shared / 4
hw_tcache001 = cores
hw_ocache                =None
sw_other                 =None

################################################################################
# Notes
################################################################################



# Enter notes_000 through notes_100 here.
# General notes: where the binaries were built, followed by the security
# mitigation attestations (one CVE per pair of lines).
notes_000                =Binaries were compiled on a system with 2x AMD EPYC 9174F CPU + 1.5TiB Memory using RHEL 8.6


notes_005                =
notes_010                =NA: The test sponsor attests, as of date of publication, that CVE-2017-5754 (Meltdown)
notes_015                =is mitigated in the system as tested and documented.
notes_020                =Yes: The test sponsor attests, as of date of publication, that CVE-2017-5753 (Spectre variant 1)
notes_025                =is mitigated in the system as tested and documented.
notes_030                =Yes: The test sponsor attests, as of date of publication, that CVE-2017-5715 (Spectre variant 2)
notes_035                =is mitigated in the system as tested and documented.
notes_040                =


# Submit notes: these describe the numactl binding performed by the "submit"
# and "bind0" settings in the thread-count sections above.
notes_submit_000         ='numactl' was used to bind copies to the cores.
notes_submit_005         =See the configuration file for details.
notes_submit_010         =


# Operating system notes: shell limits, how runcpu was launched, and the sysctl
# settings applied as root before the run.
notes_os_000             ='ulimit -s unlimited' was used to set environment stack size limit
notes_os_005             ='ulimit -l 2097152' was used to set environment locked pages in memory limit
notes_os_010             =
notes_os_015             =runcpu command invoked through numactl i.e.:
notes_os_020             =numactl --interleave=all runcpu <etc>
notes_os_025             =
notes_os_030             =To limit dirty cache to 8% of memory, 'sysctl -w vm.dirty_ratio=8' run as root.
notes_os_035             =To limit swap usage to minimum necessary, 'sysctl -w vm.swappiness=1' run as root.
notes_os_040             =To free node-local memory and avoid remote memory usage,
notes_os_045             ='sysctl -w vm.zone_reclaim_mode=1' run as root.
notes_os_050             =To clear filesystem caches, 'sync; sysctl -w vm.drop_caches=3' run as root.
notes_os_055             =To disable address space layout randomization (ASLR) to reduce run-to-run
notes_os_060             =variability, 'sysctl -w kernel.randomize_va_space=0' run as root.
notes_os_065             =
# System-wide Transparent Hugepage setting. It matches the THP_ALWAYS variable
# in the flags section, which the intspeed base "submit" line runs. Further
# notes_os_thp_* lines are added in the intspeed and fpspeed sections below.
notes_os_thp_000         =To enable Transparent Hugepages (THP) for all allocations,
notes_os_thp_005         ='echo always > /sys/kernel/mm/transparent_hugepage/enabled' and
notes_os_thp_010         ='echo always > /sys/kernel/mm/transparent_hugepage/defrag' run as root.


# Compiler notes:
notes_comp_000           =The AMD64 AOCC Compiler Suite is available at
notes_comp_005           =http://developer.amd.com/amd-aocc/
notes_comp_010           =
# notes_jemalloc_000       =jemalloc: configured and built with GCC v4.8.2 in RHEL 7.4 (No options specified)
# notes_jemalloc_005       =jemalloc 5.1.0 is available here:
# notes_jemalloc_010       =https://github.com/jemalloc/jemalloc/releases/download/5.1.0/jemalloc-5.1.0.tar.bz2
# notes_jemalloc_015       =
# sw_other000              =jemalloc: jemalloc memory allocator library v5.1.0

################################################################################
# The following note fields describe platform settings.
################################################################################

# example: (edit and uncomment as necessary)
# notes_plat_000 =BIOS settings:
# notes_plat_002 = TDP: 400
# notes_plat_004 = Determinism Slider set to Power
# notes_plat_006 = PPT: 400
# notes_plat_010 = NPS: 4
# notes_plat_011 = Workload Profile = CPU Intensive
# notes_plat_012 = TSME = Disabled
# notes_plat_014 = SEV Control = Disabled
# notes_plat_015 = Fan Speed: Maximum


################################################################################
# The following are custom fields:
################################################################################

# Use custom_fields to enter lines that are not listed here. For example:
# notes_plat_100         = Energy Bias set to Max Performance
# new_field              = Ambient temperature set to 10C


################################################################################
# The following fields must be set here for only Int benchmarks.
################################################################################
# Fields that apply only when the intspeed suite is reported:
intspeed:

sw_peak_ptrsize          =64-bit

# Intentionally empty THP note line for intspeed reports:
notes_os_thp_003         =


################################################################################
# The following fields must be set here for FP benchmarks.
################################################################################
# Fields that apply only when the fpspeed suite is reported:
fpspeed:

sw_peak_ptrsize          =64-bit

# Peak-run THP notes, one group per THP mode. Each group is: a description line,
# (optionally) the benchmark list, the quoted command, and "run as root.".
# The quoted command must agree with the description in its own group:
#   "always enable"   -> enabled=always
#   "disable"         -> enabled=never
#   "only on request" -> enabled=madvise
notes_os_thp_015         =To always enable THP for peak runs of:
notes_os_thp_020         =603.bwaves_s, 607.cactuBSSN_s, 619.lbm_s, 627.cam4_s, 628.pop2_s, 638.imagick_s, 644.nab_s, 649.fotonik3d_s:
notes_os_thp_025         ='echo always > /sys/kernel/mm/transparent_hugepage/enabled; echo always > /sys/kernel/mm/transparent_hugepage/defrag'
notes_os_thp_030         =run as root.
notes_os_thp_035         =To disable THP for peak runs of 621.wrf_s:
notes_os_thp_040         ='echo never > /sys/kernel/mm/transparent_hugepage/enabled; echo always > /sys/kernel/mm/transparent_hugepage/defrag'
notes_os_thp_045         =run as root.
notes_os_thp_050         =To enable THP only on request for peak runs of 654.roms_s:
notes_os_thp_055         ='echo madvise > /sys/kernel/mm/transparent_hugepage/enabled; echo madvise > /sys/kernel/mm/transparent_hugepage/defrag'
notes_os_thp_060         =run as root.


################################################################################
# The following fields must be set here or they will be overwritten by sysinfo.
################################################################################

# Set for both suites so that sysinfo does not overwrite them:
intspeed,fpspeed:
hw_disk                  =1 x 1.6 TB NVME SSD
# 24 x 64 GB = 1536 GB; the text continues from hw_memory000 into hw_memory001:
hw_memory000             =1536 GB (24 x 64 GB 2Rx4 PC5-5600B-R,
hw_memory001             =running at 4800)
hw_memory002             =

hw_nchips                =2
prepared_by              =Cisco Systems
sw_file                  =btrfs
sw_os000                 =SUSE Linux Enterprise Server 15 SP5
# NOTE(review): sw_os001 still holds the template placeholder text
# ("kernel version") rather than an actual kernel release string - fill in the
# kernel of the system under test before publishing.
sw_os001                 =kernel version                              # ex: Kernel 4.4.0-87-generic
sw_state                 =Run level 3 (multi-user)

################################################################################
# End of inc file
################################################################################
# Switch back to the default block after the include file:

default:

# ---- End inclusion of '/home/cpu2017/config/amd_speed_aocc400_znver4_A1.inc'
  # Switch back to default block after the include file:
default:
  # Run-only mode (allow_build is 'false'): fail_build is set to 1 here and to 0
  # in the rebuild branch below.
  # NOTE(review): presumably this makes runcpu fail rather than rebuild when a
  # binary does not match - confirm against the SPEC documentation.
  fail_build             = 1
%elif '%{allow_build}' eq 'true'
  # If you intend to rebuild, be sure to set the library paths either in the
  # build script or here:
  preENV_LIBRARY_PATH   = $[top]/%{build_lib_dir}/lib:%{ENV_LIBRARY_PATH}
% define build_ncpus 16    # controls number of simultaneous compiles
  fail_build             = 0
  # build_ncpus is used for both the parallel job count and the load-average cap:
  makeflags              = --jobs=%{build_ncpus} --load-average=%{build_ncpus}
%else
  # Any value other than "true" or "false" aborts config processing:
% error The value of "allow_build" is %{allow_build}, but it can only be "true" or "false". This error was generated
%endif


################################################################################
# Enable automated data collection per benchmark
################################################################################
# Data collection is not enabled for reportable runs.

# teeout is necessary to get data collection stdout into the logs. Best
# practices for the individual data collection items would be to have
# them store important output in separate files.  Filenames could be
# constructed from $SPEC (environment), $lognum (result number from runcpu),
# and benchmark name/number.
# Note: teeout is assigned again, with the same value, in the Header settings
# section below.
teeout = yes

# Run runcpu with '-v 35' (or greater) to log lists of variables which can
# be used in substitutions as below.
# For CPU2006, change $label to $ext
# Arguments handed to the data-collection script on both start and stop:
%define data-collection-parameters benchname='$name' benchnum='$num' benchmark='$benchmark' iteration=$iter size='$size' tune='$tune' label='$label' log='$log' lognum='$lognum' from_runcpu='$from_runcpu'
%define data-collection-start $[top]/data-collection/data-collection start %{data-collection-parameters}
%define data-collection-stop  $[top]/data-collection/data-collection stop %{data-collection-parameters}
# Wrap each benchmark command between the start and stop invocations:
monitor_specrun_wrapper = %{data-collection-start} ; $command ; %{data-collection-stop}


################################################################################
# Header settings
################################################################################
backup_config            = 0 # set to 0 if you do not want backup files
# Run "sync" after each benchmark's setup step:
bench_post_setup         = sync
# command_add_redirect: If set, the generated ${command} will include
# redirection operators (stdout, stderr), which are passed along to the shell
# that executes the command. If this variable is not set, specinvoke does the
# redirection.
command_add_redirect     = yes
env_vars                 = yes
# Flag description files: flagsurl000 is the compiler flags file and flagsurl001
# is the platform settings file. The commented-out line below is the local
# platform file referred to next to the platform_file_name macro.
flagsurl000              = http://www.spec.org/cpu2017/flags/aocc400-flags.xml
flagsurl001 = http://www.spec.org/cpu2017/flags/Cisco-Platform-Settings-AMD-v3-revA.xml
#flagsurl02              = $[top]/%{platform_file_name}
# label: User defined extension string that tags your binaries & directories:
label                    = %{ext}
line_width               = 1020
log_line_width           = 1020
mean_anyway              = yes
output_format            = all
reportable               = yes
size                     = test,train,ref
# teeout was already set to the same value in the data collection section above:
teeout                   = yes
teerunout                = yes
tune                     = base,peak
# Apply the "submit" commands from the thread-count sections to speed runs too:
use_submit_for_speed     = yes


################################################################################
# Include the flags file:
################################################################################

#include: %{flags_inc_file_name}
#  ----- Begin inclusion of 'amd_speed_aocc400_znver4_A1_flags.inc'
############################################################################
################################################################################
# AMD AOCC 4.0.0 SPEC CPU2017 V1.1.8 Speed Configuration Flags for AMD64 Linux
################################################################################
# Compilers
################################################################################

# Compiler and linker drivers for every benchmark. Each language uses the same
# driver for compiling and linking, always with -m64.
default:
CC                       = clang   -m64
CXX                      = clang++ -m64
FC                       = flang   -m64
CLD                      = clang   -m64
CXXLD                    = clang++ -m64
FLD                      = flang   -m64
# Option passed to each compiler to obtain its version string:
CC_VERSION_OPTION        = --version
CXX_VERSION_OPTION       = --version
FC_VERSION_OPTION        = --version


################################################################################
# Portability Flags
################################################################################

default:
# data model applies to all benchmarks
EXTRA_PORTABILITY         = -DSPEC_LP64

# *** Benchmark-specific portability ***
# Anything other than the data model is only allowed where a need is proven.
# (ordered by last 2 digits of benchmark number)

600.perlbench_s: #lang='C'
PORTABILITY              = -DSPEC_LINUX_X64

# 621.wrf_s and 628.pop2_s below use identical settings: a C-side define plus
# the Fortran -Mbyteswapio option.
621.wrf_s: #lang='F,C'
CPORTABILITY             = -DSPEC_CASE_FLAG
FPORTABILITY             = -Mbyteswapio

623.xalancbmk_s: #lang='CXX'
PORTABILITY              = -DSPEC_LINUX

# 627.cam4_s sets the define through PORTABILITY rather than CPORTABILITY:
627.cam4_s: #lang='F,C'
PORTABILITY              = -DSPEC_CASE_FLAG

628.pop2_s: #lang='F,C'
CPORTABILITY             = -DSPEC_CASE_FLAG
FPORTABILITY             = -Mbyteswapio


################################################################################
# Default libraries and variables
################################################################################

default:

# Libraries:
# Default link libraries. The default=base and intspeed=base sections further
# down assign EXTRA_LIBS again with their own lists.
EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdalloc \
                           -lamdlibm \
                           -lm

MATHLIBOPT               = #clearing this variable or else SPEC will set it to -lm

VECMATHLIB               = -fveclib=AMDLIBM

# Variables:
# OPT_ROOT holds the options shared by base and peak; OPT_ROOT_BASE and
# OPT_ROOT_PEAK add the optimization level (and, for peak, -flto) on top of it.
OPT_ROOT                 = -march=znver4 \
                           $(VECMATHLIB) \
                           -ffast-math \
                           -fopenmp

OPT_ROOT_BASE            = -O3 \
                           $(OPT_ROOT)

OPT_ROOT_PEAK            = -Ofast \
                           $(OPT_ROOT) \
                           -flto

# Shell snippets that set the Transparent Hugepage mode before a benchmark is
# launched; they are meant to be prepended to DEFAULT_SUBMIT in a "submit" line.
# Each one must match the command quoted in the corresponding notes_os_thp_*
# report note:
#   THP_ALWAYS  -> enabled=always,  defrag=always
#   THP_NEVER   -> enabled=never,   defrag=always
#   THP_MADVISE -> enabled=madvise, defrag=madvise
# THP_NEVER writes "always" to defrag because that is what the "To disable THP
# for peak runs of 621.wrf_s" report note documents.
THP_ALWAYS               = echo always > /sys/kernel/mm/transparent_hugepage/enabled; echo always > /sys/kernel/mm/transparent_hugepage/defrag
THP_NEVER                = echo never > /sys/kernel/mm/transparent_hugepage/enabled; echo always > /sys/kernel/mm/transparent_hugepage/defrag
THP_MADVISE              = echo madvise > /sys/kernel/mm/transparent_hugepage/enabled; echo madvise > /sys/kernel/mm/transparent_hugepage/defrag
# Same command as the "submit" lines in the thread-count sections: write the
# benchmark command to run.sh and run that script under $BIND.
DEFAULT_SUBMIT           = echo "$command" > run.sh ; $BIND bash run.sh


###############################################################################
# AOCC 4.0.0 workarounds that do not count as PORTABILITY
################################################################################
# The workarounds in this section would not qualify under the SPEC CPU
# PORTABILITY rule.
#   - In peak, they can be set as needed for individual benchmarks.
#   - In base, individual settings are not allowed; set for whole suite.
# Use EXTRA_CFLAGS, EXTRA_CXXFLAGS, and EXTRA_FFLAGS for them.
#
# See:
#     https://www.spec.org/cpu2017/Docs/runrules.html#portability
#     https://www.spec.org/cpu2017/Docs/runrules.html#BaseFlags

#######################
# Default workarounds #
#######################

default:
# Allow unused compile/link arguments without triggering warnings during build.
# The same option is given to the C, C++ and Fortran compiles and to the link:
EXTRA_CFLAGS             = -Wno-unused-command-line-argument
EXTRA_CXXFLAGS           = -Wno-unused-command-line-argument
EXTRA_FFLAGS             = -Wno-unused-command-line-argument
LDOPTIONS                = -Wno-unused-command-line-argument

####################
# Base workarounds #
####################
#
# *** NONE ***
#

##############################
# Integer workarounds - base #
##############################

# This is a speed-only configuration, so the base workaround must be attached to
# the intspeed suite; a section named for intrate would never be selected and
# 602.gcc_s would be linked without the option.
intspeed=base:
# The following is necessary for 602 gcc:
EXTRA_LDFLAGS            = -z muldefs

#########################
# FP workarounds - base #
#########################
#
# *** NONE ***
#

####################
# Peak workarounds #
####################
#
# *** NONE ***
#

##############################
# Integer workarounds - peak #
##############################

# Peak counterpart of the integer base workaround: the same linker option,
# applied to 602.gcc_s only.
602.gcc_s=peak: #lang='C'
EXTRA_LDFLAGS            = -z muldefs

#####################################
# Floating Point workarounds - peak #
#####################################
#
# *** NONE ***
#


################################################################################
# Tuning Flags
################################################################################

#####################
# Base tuning flags #
#####################

# Base tuning for every benchmark. The three per-language optimization
# variables all start from $(OPT_ROOT_BASE) (defined in the default section as
# -O3 plus $(OPT_ROOT)) and add -flto, -DSPEC_OPENMP and -zopt.
default=base:

COPTIMIZE                = $(OPT_ROOT_BASE) \
                           -flto \
                           -fstruct-layout=7 \
                           -mllvm -unroll-threshold=50 \
                           -mllvm -inline-threshold=1000 \
                           -fremap-arrays \
                           -fstrip-mining \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -Wno-return-type \
                           -zopt

CXXOPTIMIZE              = $(OPT_ROOT_BASE) \
                           -flto \
                           -mllvm -unroll-threshold=100 \
                           -finline-aggressive \
                           -mllvm -loop-unswitch-threshold=200000 \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -zopt

FOPTIMIZE                = $(OPT_ROOT_BASE) \
                           -flto \
                           -Mrecursive \
                           -funroll-loops \
                           -mllvm -lsr-in-nested-loop \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -zopt

# Link-time options. Each "-mllvm <opt>" pair is passed to the linker as two
# separate "-Wl," arguments.
LDCXXFLAGS               = -Wl,-mllvm -Wl,-x86-use-vzeroupper=false

LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3

LDFFLAGS                 = -Wl,-mllvm -Wl,-enable-X86-prefetching

#other libraries
# Put OpenMP and math libraries here:
# -lm needed at the end for some transcendental functions:
# Compared with the EXTRA_LIBS list in the default section, this one adds
# -lflang and lists -lamdlibm before -lamdalloc.
EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdlibm \
                           -lamdalloc \
                           -lflang \
                           -lm

EXTRA_FLIBS              =

# Don't put the AMD and mvec math libraries in MATHLIBOPT because it will trigger a reporting issue
# because GCC won't use them. Forcefeed all benchmarks the math libraries in EXTRA_LIBS and clear
# out MATHLIBOPT.
MATHLIBOPT               =


#########################
# intspeed tuning flags #
#########################

intspeed:
# Settings for the intspeed suite.  The header carries no `=base`/`=peak`
# specifier, so these are presumably not limited to one tuning level -- confirm
# against the SPEC CPU 2017 section-precedence rules.

# Fortran flags: shorter list than default=base FOPTIMIZE (keeps $(OPT_ROOT_BASE)
# and -flto, adds -optimize-strided-mem-cost, omits the other flags).
FOPTIMIZE                = $(OPT_ROOT_BASE) \
                           -flto \
                           -mllvm -optimize-strided-mem-cost

# Additional Fortran compile flags (unrolling controls).
EXTRA_FFLAGS             = -mllvm -unroll-aggressive \
                           -mllvm -unroll-threshold=150

# Additional C++ compile flags.
EXTRA_CXXFLAGS           = -fvirtual-function-elimination \
                           -fvisibility=hidden

# Same value as LDFLAGS in default=base: and default=peak:.
LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3

# C link flag passed through to the linker; compare `-z muldefs` in 602.gcc_s=peak.
LDCFLAGS                 = -Wl,-allow-multiple-definition

# Explicitly empty: the default sections set -x86-use-vzeroupper=false here.
LDCXXFLAGS               =

# Fortran link flags; replaces the -enable-X86-prefetching value of the default sections.
LDFFLAGS                 = -Wl,-mllvm -Wl,-inline-recursion=4 \
                           -Wl,-mllvm -Wl,-lsr-in-nested-loop \
                           -Wl,-mllvm -Wl,-enable-iv-split

##############################
# intspeed base tuning flags #
##############################

intspeed=base:
# Base-tuning library selection for intspeed.  EXTRA_LIBS is the default=base
# list without -lamdalloc; the allocator library is instead chosen per language
# below (-lamdalloc for C and Fortran, -lamdalloc-ext for C++).

EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdlibm \
                           -lflang \
                           -lm

EXTRA_CLIBS              = -lamdalloc
EXTRA_CXXLIBS            = -lamdalloc-ext
EXTRA_FLIBS              = -lamdalloc

# ${THP_ALWAYS} and ${DEFAULT_SUBMIT} are defined outside this part of the file.
# NOTE(review): THP_ALWAYS presumably switches transparent huge pages to
# "always" before the benchmark is launched -- confirm at its definition.
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

##############################
# intspeed peak tuning flags #
##############################

intspeed=peak:
# Same submit line as intspeed=base:, fpspeed=base: and fpspeed=peak:.
# ${THP_ALWAYS} and ${DEFAULT_SUBMIT} are defined outside this part of the file.

submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}


#############################
# fpspeed base tuning flags #
#############################

fpspeed=base:
# Only the submit line is set here; compiler and linker flags for fpspeed base
# are not set in this section.
# ${THP_ALWAYS} and ${DEFAULT_SUBMIT} are defined outside this part of the file.

submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

#############################
# fpspeed peak tuning flags #
#############################

fpspeed=peak:
# Suite-wide peak submit line.  Individual benchmark sections further down set
# their own submit; 621.wrf_s=peak uses ${THP_NEVER} and 654.roms_s=peak uses
# ${THP_MADVISE} instead of ${THP_ALWAYS}.

submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}


#####################
# Peak tuning flags #
#####################

default=peak:
# Peak-tuning defaults.  Per-benchmark `NNN.name=peak:` sections below set some
# of these variables again (FOPTIMIZE, LDFLAGS, EXTRA_LIBS, EXTRA_CXXFLAGS).

# C flags.  Versus default=base: $(OPT_ROOT_PEAK) replaces $(OPT_ROOT_BASE),
# -fstruct-layout is 9 instead of 7, and -flto is not listed explicitly.
COPTIMIZE                = $(OPT_ROOT_PEAK) -fstruct-layout=9 \
                           -mllvm -unroll-threshold=50 \
                           -fremap-arrays \
                           -fstrip-mining \
                           -mllvm -inline-threshold=1000 \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP -Wno-return-type \
                           -zopt

# C++ flags.  Versus default=base: no explicit -flto and no
# -loop-unswitch-threshold.
CXXOPTIMIZE              = $(OPT_ROOT_PEAK) -finline-aggressive \
                           -mllvm -unroll-threshold=100 \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -zopt

# Fortran flags.  Versus default=base: no explicit -flto, -funroll-loops or
# -lsr-in-nested-loop.
FOPTIMIZE                = $(OPT_ROOT_PEAK) -Mrecursive \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -zopt

# Link flags: same three values as in default=base:.
LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3

LDFFLAGS                 = -Wl,-mllvm -Wl,-enable-X86-prefetching

LDCXXFLAGS               = -Wl,-mllvm -Wl,-x86-use-vzeroupper=false

# Same library list as default=base EXTRA_LIBS.
EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdlibm \
                           -lamdalloc \
                           -lflang \
                           -lm

# Profile-feedback settings.  feedback is 0 here; the PASS1_*/PASS2_* flags
# select profile generation (pass 1) and profile use (pass 2) per language and
# at link time.
# NOTE(review): with feedback = 0 the PASS flags are presumably inactive unless
# another section sets feedback again -- confirm against the SPEC CPU 2017 docs.
feedback                 = 0
PASS1_CFLAGS             = -fprofile-instr-generate
PASS2_CFLAGS             = -fprofile-instr-use
PASS1_FFLAGS             = -fprofile-generate
PASS2_FFLAGS             = -fprofile-use
PASS1_CXXFLAGS           = -fprofile-instr-generate
PASS2_CXXFLAGS           = -fprofile-instr-use
PASS1_LDFLAGS            = -fprofile-instr-generate
PASS2_LDFLAGS            = -fprofile-instr-use
# Training-run command: run $command, then merge every *.profraw in the
# directory into default.profdata with llvm-profdata.
fdo_run1                 = $command ; llvm-profdata merge --output=default.profdata *.profraw


# Benchmark-specific peak tuning flags:

603.bwaves_s=peak: #lang='F'
# Peak Fortran flags for 603.bwaves_s.  Versus default=peak FOPTIMIZE: uses
# -Ofast plus $(OPT_ROOT) instead of $(OPT_ROOT_PEAK), adds -fvector-transform
# and -fscalar-transform, and omits -zopt.  $(OPT_ROOT) is defined outside this
# part of the file.
FOPTIMIZE                = -Ofast \
                           $(OPT_ROOT) \
                           -Mrecursive \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -fvector-transform \
                           -fscalar-transform
# Same submit value as the fpspeed=peak: section.
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

607.cactuBSSN_s=peak: #lang='CXX,C,F'
# Only the submit line is set; same value as the fpspeed=peak: section.
# A later `607.cactuBSSN_s:` section in this file sets basepeak = 1.
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

619.lbm_s=peak:
# Only the submit line is set; same value as the fpspeed=peak: section.
# Unlike the sibling benchmark sections, this header carries no #lang tag.
# A later `619.lbm_s:` section in this file sets basepeak = 1.
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

620.omnetpp_s=peak: #lang='CXX'
# Same libraries as default=peak EXTRA_LIBS except that -lamdalloc-ext replaces
# -lamdalloc (623.xalancbmk_s=peak makes the same substitution).
EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdlibm \
                           -lamdalloc-ext \
                           -lflang -lm

621.wrf_s=peak: #lang='F,C'
# Peak Fortran flags for 621.wrf_s.  This is the default=base FOPTIMIZE list
# without -flto, and it uses $(OPT_ROOT_BASE) rather than $(OPT_ROOT_PEAK).
# NOTE(review): the use of the BASE root macro at peak tuning looks deliberate
# but cannot be confirmed from this file alone -- check the Readme.
FOPTIMIZE                = $(OPT_ROOT_BASE) \
                           -Mrecursive \
                           -funroll-loops \
                           -mllvm -lsr-in-nested-loop \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -zopt
# The only section in this part of the file that submits with ${THP_NEVER}.
submit                   = ${THP_NEVER}; ${DEFAULT_SUBMIT}

623.xalancbmk_s=peak: #lang='CXX'
# C++ extras: the two flags from the intspeed: EXTRA_CXXFLAGS plus
# -do-block-reorder=aggressive.
EXTRA_CXXFLAGS           = -mllvm -do-block-reorder=aggressive \
                           -fvirtual-function-elimination -fvisibility=hidden
# default=peak LDFLAGS plus -do-block-reorder=aggressive, so the option is given
# at both compile and link time.
LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3 \
                           -Wl,-mllvm -Wl,-do-block-reorder=aggressive
# default=peak EXTRA_LIBS with -lamdalloc-ext in place of -lamdalloc.
EXTRA_LIBS               = -fopenmp=libomp \
                           -lomp \
                           -lamdlibm \
                           -lamdalloc-ext \
                           -lflang \
                           -lm

627.cam4_s=peak: #lang='F,C'
# LDFLAGS repeats the default=peak value unchanged; submit repeats the
# fpspeed=peak value.
LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

628.pop2_s=peak: #lang='F,C'
# Peak Fortran flags for 628.pop2_s.  Same flag set as 603.bwaves_s=peak and
# 654.roms_s=peak, but here $(OPT_ROOT) comes before -Ofast instead of after it.
FOPTIMIZE                = $(OPT_ROOT) \
                           -Ofast \
                           -Mrecursive \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -fvector-transform \
                           -fscalar-transform
# Same submit value as the fpspeed=peak: section.
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

638.imagick_s=peak: #lang='C'
# LDFLAGS repeats the default=peak value unchanged; submit repeats the
# fpspeed=peak value.
LDFLAGS                  = -Wl,-mllvm -Wl,-align-all-nofallthru-blocks=6 \
                           -Wl,-mllvm -Wl,-reduce-array-computations=3

submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

644.nab_s=peak: #lang='C'
# LDFLAGS here contains only -region-vectorize; it does not repeat the two
# options of the default=peak LDFLAGS.
# A later `644.nab_s:` section in this file sets basepeak = 1.
LDFLAGS                  = -Wl,-mllvm -Wl,-region-vectorize
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

649.fotonik3d_s=peak: #lang='F'
# NOTE(review): ENV_* settings presumably export the named variable
# (PGHPF_ZMEM=yes) into the benchmark's environment -- confirm against the
# SPEC CPU 2017 config docs and the Fortran runtime documentation.
ENV_PGHPF_ZMEM           = yes
submit                   = ${THP_ALWAYS}; ${DEFAULT_SUBMIT}

654.roms_s=peak: #lang='F'
# Peak Fortran flags for 654.roms_s; identical to the 603.bwaves_s=peak
# FOPTIMIZE value.
FOPTIMIZE                = -Ofast \
                           $(OPT_ROOT) \
                           -Mrecursive \
                           -mllvm -reduce-array-computations=3 \
                           -DSPEC_OPENMP \
                           -fvector-transform \
                           -fscalar-transform
# The only section in this part of the file that submits with ${THP_MADVISE}.
submit                   = ${THP_MADVISE}; ${DEFAULT_SUBMIT}

657.xz_s=peak: #lang='C'
# NOTE(review): presumably exports LIBOMP_NUM_HIDDEN_HELPER_THREADS=8 into the
# benchmark's environment (ENV_* convention) -- confirm against the SPEC CPU
# 2017 config docs and the libomp documentation.
ENV_LIBOMP_NUM_HIDDEN_HELPER_THREADS = 8
# ---- End inclusion of '/home/cpu2017/config/amd_speed_aocc400_znver4_A1_flags.inc'


# The following settings were obtained by running the sysinfo_program
# 'specperl $[top]/bin/sysinfo' (sysinfo:SHA:2eb381fc1a58eb8122e4a1b875c1e38b3489dac84088192aa0ec6d157b084d06)
default:
notes_plat_sysinfo_000 =
notes_plat_sysinfo_005 = Sysinfo program /home/cpu2017/bin/sysinfo
notes_plat_sysinfo_010 = Rev: r6732 of 2022-11-07 fe91c89b7ed5c36ae2c92cc097bec197
notes_plat_sysinfo_015 = running on localhost Fri Jul 12 07:03:59 2024
notes_plat_sysinfo_020 =
notes_plat_sysinfo_025 = SUT (System Under Test) info as seen by some common utilities.
notes_plat_sysinfo_030 =
notes_plat_sysinfo_035 = ------------------------------------------------------------
notes_plat_sysinfo_040 = Table of contents
notes_plat_sysinfo_045 = ------------------------------------------------------------
notes_plat_sysinfo_050 =  1. uname -a
notes_plat_sysinfo_055 =  2. w
notes_plat_sysinfo_060 =  3. Username
notes_plat_sysinfo_065 =  4. ulimit -a
notes_plat_sysinfo_070 =  5. sysinfo process ancestry
notes_plat_sysinfo_075 =  6. /proc/cpuinfo
notes_plat_sysinfo_080 =  7. lscpu
notes_plat_sysinfo_085 =  8. numactl --hardware
notes_plat_sysinfo_090 =  9. /proc/meminfo
notes_plat_sysinfo_095 = 10. who -r
notes_plat_sysinfo_100 = 11. Systemd service manager version: systemd 249 (249.16+suse.171.gdad0071f15)
notes_plat_sysinfo_105 = 12. Services, from systemctl list-unit-files
notes_plat_sysinfo_110 = 13. Linux kernel boot-time arguments, from /proc/cmdline
notes_plat_sysinfo_115 = 14. cpupower frequency-info
notes_plat_sysinfo_120 = 15. sysctl
notes_plat_sysinfo_125 = 16. /sys/kernel/mm/transparent_hugepage
notes_plat_sysinfo_130 = 17. /sys/kernel/mm/transparent_hugepage/khugepaged
notes_plat_sysinfo_135 = 18. OS release
notes_plat_sysinfo_140 = 19. Disk information
notes_plat_sysinfo_145 = 20. /sys/devices/virtual/dmi/id
notes_plat_sysinfo_150 = 21. dmidecode
notes_plat_sysinfo_155 = 22. BIOS
notes_plat_sysinfo_160 = ------------------------------------------------------------
notes_plat_sysinfo_165 =
notes_plat_sysinfo_170 = ------------------------------------------------------------
notes_plat_sysinfo_175 = 1. uname -a
notes_plat_sysinfo_180 =   Linux localhost 5.14.21-150500.53-default #1 SMP PREEMPT_DYNAMIC Wed May 10 07:56:26 UTC 2023 (b630043)
notes_plat_sysinfo_185 =   x86_64 x86_64 x86_64 GNU/Linux
notes_plat_sysinfo_190 =
notes_plat_sysinfo_195 = ------------------------------------------------------------
notes_plat_sysinfo_200 = 2. w
notes_plat_sysinfo_205 =    07:03:59 up  7:05,  1 user,  load average: 0.00, 0.00, 0.00
notes_plat_sysinfo_210 =   USER     TTY      FROM             LOGIN@   IDLE   JCPU   PCPU WHAT
notes_plat_sysinfo_215 =   root     tty1     -                Wed15   23.00s  1.11s  0.10s /bin/bash ./amd_speed_aocc400_znver4_A1.sh
notes_plat_sysinfo_220 =
notes_plat_sysinfo_225 = ------------------------------------------------------------
notes_plat_sysinfo_230 = 3. Username
notes_plat_sysinfo_235 =   From environment variable $USER:  root
notes_plat_sysinfo_240 =
notes_plat_sysinfo_245 = ------------------------------------------------------------
notes_plat_sysinfo_250 = 4. ulimit -a
notes_plat_sysinfo_255 =   core file size          (blocks, -c) unlimited
notes_plat_sysinfo_260 =   data seg size           (kbytes, -d) unlimited
notes_plat_sysinfo_265 =   scheduling priority             (-e) 0
notes_plat_sysinfo_270 =   file size               (blocks, -f) unlimited
notes_plat_sysinfo_275 =   pending signals                 (-i) 6191363
notes_plat_sysinfo_280 =   max locked memory       (kbytes, -l) 2097152
notes_plat_sysinfo_285 =   max memory size         (kbytes, -m) unlimited
notes_plat_sysinfo_290 =   open files                      (-n) 1024
notes_plat_sysinfo_295 =   pipe size            (512 bytes, -p) 8
notes_plat_sysinfo_300 =   POSIX message queues     (bytes, -q) 819200
notes_plat_sysinfo_305 =   real-time priority              (-r) 0
notes_plat_sysinfo_310 =   stack size              (kbytes, -s) unlimited
notes_plat_sysinfo_315 =   cpu time               (seconds, -t) unlimited
notes_plat_sysinfo_320 =   max user processes              (-u) 6191363
notes_plat_sysinfo_325 =   virtual memory          (kbytes, -v) unlimited
notes_plat_sysinfo_330 =   file locks                      (-x) unlimited
notes_plat_sysinfo_335 =
notes_plat_sysinfo_340 = ------------------------------------------------------------
notes_plat_sysinfo_345 = 5. sysinfo process ancestry
notes_plat_sysinfo_350 =  /usr/lib/systemd/systemd --switched-root --system --deserialize 30
notes_plat_sysinfo_355 =  login -- root
notes_plat_sysinfo_360 =  -bash
notes_plat_sysinfo_365 =  python3 ./run_amd_speed_aocc400_znver4_A1.py -b fpspeed
notes_plat_sysinfo_370 =  /bin/bash ./amd_speed_aocc400_znver4_A1.sh
notes_plat_sysinfo_375 =  runcpu --config amd_speed_aocc400_znver4_A1.cfg --tune all --reportable --iterations 3 fpspeed
notes_plat_sysinfo_380 =  runcpu --configfile amd_speed_aocc400_znver4_A1.cfg --tune all --reportable --iterations 3 --nopower
notes_plat_sysinfo_385 =    --runmode speed --tune base:peak --size test:train:refspeed fpspeed --nopreenv --note-preenv --logfile
notes_plat_sysinfo_390 =    $SPEC/tmp/CPU2017.001/templogs/preenv.fpspeed.001.0.log --lognum 001.0 --from_runcpu 2
notes_plat_sysinfo_395 =  specperl $SPEC/bin/sysinfo
notes_plat_sysinfo_400 = $SPEC = /home/cpu2017
notes_plat_sysinfo_405 =
notes_plat_sysinfo_410 = ------------------------------------------------------------
notes_plat_sysinfo_415 = 6. /proc/cpuinfo
notes_plat_sysinfo_420 =     model name      : AMD EPYC 9354 32-Core Processor
notes_plat_sysinfo_425 =     vendor_id       : AuthenticAMD
notes_plat_sysinfo_430 =     cpu family      : 25
notes_plat_sysinfo_435 =     model           : 17
notes_plat_sysinfo_440 =     stepping        : 1
notes_plat_sysinfo_445 =     microcode       : 0xa101148
notes_plat_sysinfo_450 =     bugs            : sysret_ss_attrs spectre_v1 spectre_v2 spec_store_bypass
notes_plat_sysinfo_455 =     TLB size        : 3584 4K pages
notes_plat_sysinfo_460 =     cpu cores       : 32
notes_plat_sysinfo_465 =     siblings        : 32
notes_plat_sysinfo_470 =     2 physical ids (chips)
notes_plat_sysinfo_475 =     64 processors (hardware threads)
notes_plat_sysinfo_480 =     physical id 0: core ids 0-3,16-19,32-35,48-51,64-67,80-83,96-99,112-115
notes_plat_sysinfo_485 =     physical id 1: core ids 0-3,16-19,32-35,48-51,64-67,80-83,96-99,112-115
notes_plat_sysinfo_490 =     physical id 0: apicids 0-3,16-19,32-35,48-51,64-67,80-83,96-99,112-115
notes_plat_sysinfo_495 =     physical id 1: apicids 128-131,144-147,160-163,176-179,192-195,208-211,224-227,240-243
notes_plat_sysinfo_500 =   Caution: /proc/cpuinfo data regarding chips, cores, and threads is not necessarily reliable, especially for
notes_plat_sysinfo_505 =   virtualized systems.  Use the above data carefully.
notes_plat_sysinfo_510 =
notes_plat_sysinfo_515 = ------------------------------------------------------------
notes_plat_sysinfo_520 = 7. lscpu
notes_plat_sysinfo_525 =
notes_plat_sysinfo_530 = From lscpu from util-linux 2.37.4:
notes_plat_sysinfo_535 =   Architecture:                    x86_64
notes_plat_sysinfo_540 =   CPU op-mode(s):                  32-bit, 64-bit
notes_plat_sysinfo_545 =   Address sizes:                   52 bits physical, 57 bits virtual
notes_plat_sysinfo_550 =   Byte Order:                      Little Endian
notes_plat_sysinfo_555 =   CPU(s):                          64
notes_plat_sysinfo_560 =   On-line CPU(s) list:             0-63
notes_plat_sysinfo_565 =   Vendor ID:                       AuthenticAMD
notes_plat_sysinfo_570 =   Model name:                      AMD EPYC 9354 32-Core Processor
notes_plat_sysinfo_575 =   CPU family:                      25
notes_plat_sysinfo_580 =   Model:                           17
notes_plat_sysinfo_585 =   Thread(s) per core:              1
notes_plat_sysinfo_590 =   Core(s) per socket:              32
notes_plat_sysinfo_595 =   Socket(s):                       2
notes_plat_sysinfo_600 =   Stepping:                        1
notes_plat_sysinfo_605 =   Frequency boost:                 enabled
notes_plat_sysinfo_610 =   CPU max MHz:                     3799.0720
notes_plat_sysinfo_615 =   CPU min MHz:                     1500.0000
notes_plat_sysinfo_620 =   BogoMIPS:                        6489.96
notes_plat_sysinfo_625 =   Flags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36
notes_plat_sysinfo_630 =                                    clflush mmx fxsr sse sse2 ht syscall nx mmxext fxsr_opt pdpe1gb rdtscp lm
notes_plat_sysinfo_635 =                                    constant_tsc rep_good amd_lbr_v2 nopl nonstop_tsc cpuid extd_apicid
notes_plat_sysinfo_640 =                                    aperfmperf rapl pni pclmulqdq monitor ssse3 fma cx16 pcid sse4_1 sse4_2
notes_plat_sysinfo_645 =                                    x2apic movbe popcnt aes xsave avx f16c rdrand lahf_lm cmp_legacy svm
notes_plat_sysinfo_650 =                                    extapic cr8_legacy abm sse4a misalignsse 3dnowprefetch osvw ibs skinit wdt
notes_plat_sysinfo_655 =                                    tce topoext perfctr_core perfctr_nb bpext perfctr_llc mwaitx cpb cat_l3
notes_plat_sysinfo_660 =                                    cdp_l3 invpcid_single hw_pstate ssbd mba perfmon_v2 ibrs ibpb stibp
notes_plat_sysinfo_665 =                                    vmmcall fsgsbase bmi1 avx2 smep bmi2 invpcid cqm rdt_a avx512f avx512dq
notes_plat_sysinfo_670 =                                    rdseed adx smap avx512ifma clflushopt clwb avx512cd sha_ni avx512bw
notes_plat_sysinfo_675 =                                    avx512vl xsaveopt xsavec xgetbv1 xsaves cqm_llc cqm_occup_llc
notes_plat_sysinfo_680 =                                    cqm_mbm_total cqm_mbm_local avx512_bf16 clzero irperf xsaveerptr rdpru
notes_plat_sysinfo_685 =                                    wbnoinvd amd_ppin cppc arat npt lbrv svm_lock nrip_save tsc_scale
notes_plat_sysinfo_690 =                                    vmcb_clean flushbyasid decodeassists pausefilter pfthreshold avic
notes_plat_sysinfo_695 =                                    v_vmsave_vmload vgif v_spec_ctrl avx512vbmi umip pku ospke avx512_vbmi2
notes_plat_sysinfo_700 =                                    gfni vaes vpclmulqdq avx512_vnni avx512_bitalg avx512_vpopcntdq la57 rdpid
notes_plat_sysinfo_705 =                                    overflow_recov succor smca flush_l1d
notes_plat_sysinfo_710 =   Virtualization:                  AMD-V
notes_plat_sysinfo_715 =   L1d cache:                       2 MiB (64 instances)
notes_plat_sysinfo_720 =   L1i cache:                       2 MiB (64 instances)
notes_plat_sysinfo_725 =   L2 cache:                        64 MiB (64 instances)
notes_plat_sysinfo_730 =   L3 cache:                        512 MiB (16 instances)
notes_plat_sysinfo_735 =   NUMA node(s):                    4
notes_plat_sysinfo_740 =   NUMA node0 CPU(s):               0-15
notes_plat_sysinfo_745 =   NUMA node1 CPU(s):               16-31
notes_plat_sysinfo_750 =   NUMA node2 CPU(s):               32-47
notes_plat_sysinfo_755 =   NUMA node3 CPU(s):               48-63
notes_plat_sysinfo_760 =   Vulnerability Itlb multihit:     Not affected
notes_plat_sysinfo_765 =   Vulnerability L1tf:              Not affected
notes_plat_sysinfo_770 =   Vulnerability Mds:               Not affected
notes_plat_sysinfo_775 =   Vulnerability Meltdown:          Not affected
notes_plat_sysinfo_780 =   Vulnerability Mmio stale data:   Not affected
notes_plat_sysinfo_785 =   Vulnerability Retbleed:          Not affected
notes_plat_sysinfo_790 =   Vulnerability Spec store bypass: Mitigation; Speculative Store Bypass disabled via prctl and seccomp
notes_plat_sysinfo_795 =   Vulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization
notes_plat_sysinfo_800 =   Vulnerability Spectre v2:        Mitigation; Retpolines, IBPB conditional, IBRS_FW, STIBP disabled, RSB
notes_plat_sysinfo_805 =                                    filling, PBRSB-eIBRS Not affected
notes_plat_sysinfo_810 =   Vulnerability Srbds:             Not affected
notes_plat_sysinfo_815 =   Vulnerability Tsx async abort:   Not affected
notes_plat_sysinfo_820 =
notes_plat_sysinfo_825 = From lscpu --cache:
notes_plat_sysinfo_830 =      NAME ONE-SIZE ALL-SIZE WAYS TYPE        LEVEL  SETS PHY-LINE COHERENCY-SIZE
notes_plat_sysinfo_835 =      L1d       32K       2M    8 Data            1    64        1             64
notes_plat_sysinfo_840 =      L1i       32K       2M    8 Instruction     1    64        1             64
notes_plat_sysinfo_845 =      L2         1M      64M    8 Unified         2  2048        1             64
notes_plat_sysinfo_850 =      L3        32M     512M   16 Unified         3 32768        1             64
notes_plat_sysinfo_855 =
notes_plat_sysinfo_860 = ------------------------------------------------------------
notes_plat_sysinfo_865 = 8. numactl --hardware
notes_plat_sysinfo_870 = NOTE: a numactl 'node' might or might not correspond to a physical chip.
notes_plat_sysinfo_875 =   available: 4 nodes (0-3)
notes_plat_sysinfo_880 =   node 0 cpus: 0-15
notes_plat_sysinfo_885 =   node 0 size: 386766 MB
notes_plat_sysinfo_890 =   node 0 free: 386320 MB
notes_plat_sysinfo_895 =   node 1 cpus: 16-31
notes_plat_sysinfo_900 =   node 1 size: 387067 MB
notes_plat_sysinfo_905 =   node 1 free: 386241 MB
notes_plat_sysinfo_910 =   node 2 cpus: 32-47
notes_plat_sysinfo_915 =   node 2 size: 387067 MB
notes_plat_sysinfo_920 =   node 2 free: 386159 MB
notes_plat_sysinfo_925 =   node 3 cpus: 48-63
notes_plat_sysinfo_930 =   node 3 size: 386969 MB
notes_plat_sysinfo_935 =   node 3 free: 386562 MB
notes_plat_sysinfo_940 =   node distances:
notes_plat_sysinfo_945 =   node   0   1   2   3
notes_plat_sysinfo_950 =     0:  10  12  32  32
notes_plat_sysinfo_955 =     1:  12  10  32  32
notes_plat_sysinfo_960 =     2:  32  32  10  12
notes_plat_sysinfo_965 =     3:  32  32  12  10
notes_plat_sysinfo_970 =
notes_plat_sysinfo_975 = ------------------------------------------------------------
notes_plat_sysinfo_980 = 9. /proc/meminfo
notes_plat_sysinfo_985 =    MemTotal:       1585019632 kB
notes_plat_sysinfo_990 =
notes_plat_sysinfo_995 = ------------------------------------------------------------
notes_plat_sysinfo_1000= 10. who -r
notes_plat_sysinfo_1005=   run-level 3 Jul 10 15:08
notes_plat_sysinfo_1010=
notes_plat_sysinfo_1015= ------------------------------------------------------------
notes_plat_sysinfo_1020= 11. Systemd service manager version: systemd 249 (249.16+suse.171.gdad0071f15)
notes_plat_sysinfo_1025=   Default Target  Status
notes_plat_sysinfo_1030=   multi-user      running
notes_plat_sysinfo_1035=
notes_plat_sysinfo_1040= ------------------------------------------------------------
notes_plat_sysinfo_1045= 12. Services, from systemctl list-unit-files
notes_plat_sysinfo_1050=   STATE            UNIT FILES
notes_plat_sysinfo_1055=   enabled          YaST2-Firstboot YaST2-Second-Stage apparmor auditd cron getty@ irqbalance iscsi
notes_plat_sysinfo_1060=                    issue-generator kbdsettings klog libvirtd lvm2-monitor nscd postfix purge-kernels rollback
notes_plat_sysinfo_1065=                    rsyslog smartd sshd systemd-pstore wicked wickedd-auto4 wickedd-dhcp4 wickedd-dhcp6
notes_plat_sysinfo_1070=                    wickedd-nanny
notes_plat_sysinfo_1075=   enabled-runtime  systemd-remount-fs
notes_plat_sysinfo_1080=   disabled         autofs autoyast-initscripts blk-availability boot-sysctl ca-certificates chrony-wait
notes_plat_sysinfo_1085=                    chronyd console-getty cups cups-browsed debug-shell dnsmasq ebtables exchange-bmc-os-info
notes_plat_sysinfo_1090=                    firewalld gpm grub2-once haveged haveged-switch-root hwloc-dump-hwdata ipmi ipmievd
notes_plat_sysinfo_1095=                    iscsi-init iscsid issue-add-ssh-keys kdump kdump-early kexec-load ksm kvm_stat
notes_plat_sysinfo_1100=                    libvirt-guests lunmask man-db-create multipathd nfs nfs-blkmap nfs-server nfsserver
notes_plat_sysinfo_1105=                    rpcbind rpmconfigcheck rsyncd serial-getty@ smartd_generate_opts snmpd snmptrapd
notes_plat_sysinfo_1110=                    strongswan strongswan-starter svnserve systemd-boot-check-no-failures
notes_plat_sysinfo_1115=                    systemd-network-generator systemd-nspawn@ systemd-sysext systemd-time-wait-sync
notes_plat_sysinfo_1120=                    systemd-timesyncd tcsd udisks2 virtinterfaced virtnetworkd virtnodedevd virtnwfilterd
notes_plat_sysinfo_1125=                    virtproxyd virtqemud virtsecretd virtstoraged
notes_plat_sysinfo_1130=   indirect         pcscd virtlockd virtlogd wickedd
notes_plat_sysinfo_1135=
notes_plat_sysinfo_1140= ------------------------------------------------------------
notes_plat_sysinfo_1145= 13. Linux kernel boot-time arguments, from /proc/cmdline
notes_plat_sysinfo_1150=   BOOT_IMAGE=/boot/vmlinuz-5.14.21-150500.53-default
notes_plat_sysinfo_1155=   root=UUID=5eac0278-b5d7-4d70-9f22-3587a0d03dd8
notes_plat_sysinfo_1160=   splash=silent
notes_plat_sysinfo_1165=   mitigations=auto
notes_plat_sysinfo_1170=   quiet
notes_plat_sysinfo_1175=   security=apparmor
notes_plat_sysinfo_1180=
notes_plat_sysinfo_1185= ------------------------------------------------------------
notes_plat_sysinfo_1190= 14. cpupower frequency-info
notes_plat_sysinfo_1195=   analyzing CPU 0:
notes_plat_sysinfo_1200=     current policy: frequency should be within 1.50 GHz and 3.25 GHz.
notes_plat_sysinfo_1205=                     The governor "performance" may decide which speed to use
notes_plat_sysinfo_1210=                     within this range.
notes_plat_sysinfo_1215=     boost state support:
notes_plat_sysinfo_1220=       Supported: yes
notes_plat_sysinfo_1225=       Active: yes
notes_plat_sysinfo_1230=
notes_plat_sysinfo_1235= ------------------------------------------------------------
notes_plat_sysinfo_1240= 15. sysctl
notes_plat_sysinfo_1245=   kernel.numa_balancing               1
notes_plat_sysinfo_1250=   kernel.randomize_va_space           0
notes_plat_sysinfo_1255=   vm.compaction_proactiveness        20
notes_plat_sysinfo_1260=   vm.dirty_background_bytes           0
notes_plat_sysinfo_1265=   vm.dirty_background_ratio          10
notes_plat_sysinfo_1270=   vm.dirty_bytes                      0
notes_plat_sysinfo_1275=   vm.dirty_expire_centisecs        3000
notes_plat_sysinfo_1280=   vm.dirty_ratio                      8
notes_plat_sysinfo_1285=   vm.dirty_writeback_centisecs      500
notes_plat_sysinfo_1290=   vm.dirtytime_expire_seconds     43200
notes_plat_sysinfo_1295=   vm.extfrag_threshold              500
notes_plat_sysinfo_1300=   vm.min_unmapped_ratio               1
notes_plat_sysinfo_1305=   vm.nr_hugepages                     0
notes_plat_sysinfo_1310=   vm.nr_hugepages_mempolicy           0
notes_plat_sysinfo_1315=   vm.nr_overcommit_hugepages          0
notes_plat_sysinfo_1320=   vm.swappiness                       1
notes_plat_sysinfo_1325=   vm.watermark_boost_factor       15000
notes_plat_sysinfo_1330=   vm.watermark_scale_factor          10
notes_plat_sysinfo_1335=   vm.zone_reclaim_mode                1
notes_plat_sysinfo_1340=
notes_plat_sysinfo_1345= ------------------------------------------------------------
notes_plat_sysinfo_1350= 16. /sys/kernel/mm/transparent_hugepage
notes_plat_sysinfo_1355=   defrag          [always] defer defer+madvise madvise never
notes_plat_sysinfo_1360=   enabled         [always] madvise never
notes_plat_sysinfo_1365=   hpage_pmd_size  2097152
notes_plat_sysinfo_1370=   shmem_enabled   always within_size advise [never] deny force
notes_plat_sysinfo_1375=
notes_plat_sysinfo_1380= ------------------------------------------------------------
notes_plat_sysinfo_1385= 17. /sys/kernel/mm/transparent_hugepage/khugepaged
notes_plat_sysinfo_1390=   alloc_sleep_millisecs   60000
notes_plat_sysinfo_1395=   defrag                      1
notes_plat_sysinfo_1400=   max_ptes_none             511
notes_plat_sysinfo_1405=   max_ptes_shared           256
notes_plat_sysinfo_1410=   max_ptes_swap              64
notes_plat_sysinfo_1415=   pages_to_scan            4096
notes_plat_sysinfo_1420=   scan_sleep_millisecs    10000
notes_plat_sysinfo_1425=
notes_plat_sysinfo_1430= ------------------------------------------------------------
notes_plat_sysinfo_1435= 18. OS release
notes_plat_sysinfo_1440=   From /etc/*-release /etc/*-version
notes_plat_sysinfo_1445=   os-release SUSE Linux Enterprise Server 15 SP5
notes_plat_sysinfo_1450=
notes_plat_sysinfo_1455= ------------------------------------------------------------
notes_plat_sysinfo_1460= 19. Disk information
notes_plat_sysinfo_1465= SPEC is set to: /home/cpu2017
notes_plat_sysinfo_1470=   Filesystem     Type   Size  Used Avail Use% Mounted on
notes_plat_sysinfo_1475=   /dev/sdb2      btrfs  222G   11G  211G   5% /home
notes_plat_sysinfo_1480=
notes_plat_sysinfo_1485= ------------------------------------------------------------
notes_plat_sysinfo_1490= 20. /sys/devices/virtual/dmi/id
notes_plat_sysinfo_1495=     Vendor:         Cisco Systems Inc
notes_plat_sysinfo_1500=     Product:        UCSC-C245-M8SX
notes_plat_sysinfo_1505=     Serial:         WZP27360C65
notes_plat_sysinfo_1510=
notes_plat_sysinfo_1515= ------------------------------------------------------------
notes_plat_sysinfo_1520= 21. dmidecode
notes_plat_sysinfo_1525=   Additional information from dmidecode 3.4 follows.  WARNING: Use caution when you interpret this section.
notes_plat_sysinfo_1530=   The 'dmidecode' program reads system data which is "intended to allow hardware to be accurately
notes_plat_sysinfo_1535=   determined", but the intent may not be met, as there are frequent changes to hardware, firmware, and the
notes_plat_sysinfo_1540=   "DMTF SMBIOS" standard.
notes_plat_sysinfo_1545=   Memory:
notes_plat_sysinfo_1550=     4x 0xCE00 M321R8GA0PB0-CWMJH 64 GB 2 rank 5600, configured at 4800
notes_plat_sysinfo_1555=     20x 0xCE00 M321R8GA0PB0-CWMKJ 64 GB 2 rank 5600, configured at 4800
notes_plat_sysinfo_1560=
notes_plat_sysinfo_1565=
notes_plat_sysinfo_1570= ------------------------------------------------------------
notes_plat_sysinfo_1575= 22. BIOS
notes_plat_sysinfo_1580= (This section combines info from /sys/devices and dmidecode.)
notes_plat_sysinfo_1585=    BIOS Vendor:       Cisco Systems, Inc.
notes_plat_sysinfo_1590=    BIOS Version:      C245M8.4.3.4a.0.0520240849
notes_plat_sysinfo_1595=    BIOS Date:         05/20/2024
notes_plat_sysinfo_1600=    BIOS Revision:     5.27
# Report fields filled in by the sysinfo program.
# NOTE(review): hw_disk, hw_memory001/002, prepared_by and sw_state still carry
# the generator's placeholder text ("add more disk info here", "fixme: ...",
# "(add definition here)").  The dmidecode notes above list 4 + 20 DIMMs of
# 64 GB each.  Confirm these fields are overridden elsewhere before publishing.
hw_cpu_name        = AMD EPYC 9354
hw_disk            = 222 GB  add more disk info here
hw_memory001       = 1511.593 GB fixme: If using DDR4, the format is:
hw_memory002       = 'N GB (N x N GB nRxn PC4-nnnnX-X)'
hw_nchips          = 2
hw_ncores          = 64
hw_nthreadspercore = 1
prepared_by        = root  (is never output, only tags rawfile)
sw_file            = btrfs
sw_os001           = SUSE Linux Enterprise Server 15 SP5
sw_os002           = 5.14.21-150500.53-default
sw_state           = Run level 3 (add definition here)
# End of settings added by sysinfo_program


644.nab_s:
# The following setting was inserted automatically as a result of
# post-run basepeak application.
# NOTE(review): the earlier `644.nab_s=peak:` section sets peak-only LDFLAGS and
# submit; with basepeak = 1 the peak result presumably reuses the base build --
# confirm against the SPEC CPU 2017 basepeak documentation.
basepeak = 1


619.lbm_s:
# The following setting was inserted automatically as a result of
# post-run basepeak application.
# NOTE(review): the earlier `619.lbm_s=peak:` section sets a peak-only submit
# line; with basepeak = 1 the peak result presumably reuses the base build --
# confirm against the SPEC CPU 2017 basepeak documentation.
basepeak = 1


607.cactuBSSN_s:
# The following setting was inserted automatically as a result of
# post-run basepeak application.
# NOTE(review): the earlier `607.cactuBSSN_s=peak:` section sets a peak-only
# submit line; with basepeak = 1 the peak result presumably reuses the base
# build -- confirm against the SPEC CPU 2017 basepeak documentation.
basepeak = 1


# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
power_management000 = BIOS and OS set to prefer performance
power_management001 = at the cost of additional power usage.
notes_plat_form_000 =
notes_plat_form_005 =BIOS settings:
notes_plat_form_010 =SMT Mode set to Disabled
notes_plat_form_015 =NUMA nodes per socket set to NPS1
notes_plat_form_020 =Determinism Slider set to Power
notes_plat_form_025 =DF C-States set to Disabled
notes_plat_form_030 =TDP set to 400
notes_plat_form_035 =PPT set to 400
notes_plat_form_040 =ACPI SRAT L3 Cache as NUMA Domain set to Enabled