# Invocation command line:
# /usr/cpu2000/bin/runspec -c amd353K8 -r -u 4 -T all all
############################################################################
# Invocation command line:
# runspec -c amd353K8 -T all all
############################################################################
############################################################################
# SPEC2000 Suse Linux config file
# August 2003.
#
# PGI 5.1-3 Fortran Compiler
# SuSE optional gcc33 extension gcc33
#
# These variables below MUST be checked for accuracy before submitting
company_name = AMD
#
# Make sure the motherboard and clock rate is checked.
#
hw_model = Verari QuatreX-64 (TM)
#
# Make sure the processor and clock rate is checked.
#
hw_cpu = AMD Opteron (TM) 850
#
# Make sure the frequency is checked. The field MUST be an integer.
#
hw_cpu_mhz = 2400
hw_disk = SCSI, Ultra-320, 10k rpm
hw_fpu = Integrated
#
# Make sure the memory is checked.
#
hw_memory = 8 x 512 PC3200 DDR SDRAM CL3.0
#
# Note here any deviations from default BIOS settings
# Optimized settings
# SRAT on, ECC on, DRAM Interleave on
# Make sure the system bus frequency is checked.
# NUMA enabled Suse stock NUMA kernel 2.4.21-143 schedutils taskset enabled ECC Disabled
# NOTE(review): the two lines above disagree about ECC ("ECC on" vs
# "ECC Disabled") - confirm the actual BIOS setting before submitting.
# Make sure the dates are checked.
#
hw_avail = May-2004
test_date = Apr-2004
#
# Make sure the file system type is checked.
#
sw_file = Linux/ext3
#
# Make sure the OS is checked.
#
sw_os = SuSE Linux 8.0 SLES 64 bit (SP3) SuSe NUMA kernel 2.4.21-143
#
#
# Make sure your identity is correct
#
hw_vendor = AMD
tester_name = AMD
license_num = 0000
#
# These variables below are less likely to need changing
hw_ncpu = 4
hw_ncpuorder = 4
hw_ocache = N/A
hw_other = None
hw_parallel = No
hw_pcache = 64KBI + 64KBD on chip
hw_scache = 1024KB(I+D) on chip
hw_tcache = N/A
sw_state = Multi-user SuSE Run level 3
VENDOR =
action = validate
tune = base
output_format = asc,html,config
ext = amd353K8.gcc33.pgi51
check_md5 = 1
reportable = 1
# schedutils taskset enabled command
# The submit command computes a mask of (1 << $SPECUSERNUM) and launches the
# benchmark command through /usr/bin/taskset with that mask.
submit= "MYNUM=$SPECUSERNUM" ; MYMASK=\$((1<<\$SPECUSERNUM)); /usr/bin/taskset \$MYMASK $command
#
# These are listed as benchmark-tuning-extension-machine
#
default=default=default=default:
# Compiler locations: gcc/g++ from GCCDIR, pgf90 (used for both FC and F77)
# from PGIDIR.
GCCDIR = /opt/gcc33/bin
CC = $(GCCDIR)/gcc
CXX = $(GCCDIR)/g++
PGIDIR = /usr/pgi/linux86-64/5.1/bin
FC = $(PGIDIR)/pgf90
F77 = $(PGIDIR)/pgf90

################################################################
# Portability Flags
################################################################
fp=default=default=default:
notes0045= PORTABILITY=-DSPEC_CPU2000_LP64 is applied to all the C benchmarks.

int=default=default=default:
notes0040= PORTABILITY=-DSPEC_CPU2000_LP64 is applied to all benchmarks,
notes0041= except for peak runs of 181.mcf, 197.parser and 300.twolf, which
notes0042= are compiled for 32-bit in peak.
PORTABILITY = -DSPEC_CPU2000_LP64

186.crafty=default=default=default:
notes0045= 186.crafty: CPORTABILITY=-DLINUX_i386
CPORTABILITY = -DLINUX_i386

176.gcc=default=default=default:
notes0049= 176.gcc: Approved src.alt is used
srcalt = 64bitgcc

252.eon=default=default=default:
notes0050= 252.eon: CXXPORTABILITY=-DHAS_ERRLIST -DFMAX_IS_DOUBLE
notes0051= Approved src.alt is used.
EXTRA_CXXFLAGS = -DHAS_ERRLIST -DFMAX_IS_DOUBLE
srcalt = fmax_errno

253.perlbmk=default=default=default:
notes0052= 253.perlbmk: CPORTABILITY=-DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL
notes0053= -DSPEC_CPU2000_GLIBC22
CPORTABILITY = -DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL -DSPEC_CPU2000_GLIBC22

254.gap=default=default=default:
notes0055= 254.gap: CPORTABILITY=-DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO
notes0056= -DSYS_HAS_SIGNAL_PROTO -DSYS_HAS_ANSI -DSYS_HAS_CALLOC_PROTO
CPORTABILITY = -DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO -DSYS_HAS_SIGNAL_PROTO -DSYS_HAS_ANSI -DSYS_HAS_CALLOC_PROTO

178.galgel=default=default=default:
notes0050= 178.galgel: -Mfixed
FPORTABILITY= -Mfixed

################################################################
# Baseline Tuning Flags
################################################################
#
# int2000
# Base tuning default optimization
#
int=base=default=default:
notes0080= Baseline C: gcc -O3 -funroll-all-loops +FDO
COPTIMIZE = -O3 -funroll-all-loops
ONESTEP = yes
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

252.eon=base=default=default:
notes0085= Baseline C++: g++ -O3 -funroll-all-loops +FDO
CXXOPTIMIZE = -O3 -funroll-all-loops
ONESTEP = yes
PASS1_CXXFLAGS = -fprofile-arcs
PASS2_CXXFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CXXFLAGS)
PASS2_LDFLAGS = $(PASS2_CXXFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

#
# fp2000
# Base tuning default optimization
#
# Fortran benchmarks
#
fp=base=default=default:
notes0085= Baseline: Fortran pgf90 -fastsse -Mipa=fast
OPTIMIZE =
CPORTABILITY = -DSPEC_CPU2000_LP64
PASS1_FFLAGS = -fastsse -Mipa=fast
PASS2_FFLAGS = -fastsse -Mipa=fast
PASS1_LDFFLAGS = $(PASS1_FFLAGS)
PASS2_LDFFLAGS = $(PASS2_FFLAGS)
ONESTEP=yes

#
# C benchmarks
#
177.mesa=base=default=default:
notes0080= Baseline: C gcc -O3 -funroll-all-loops +FDO
COPTIMIZE = -O3 -funroll-all-loops
CFLAGS =
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

179.art=base=default=default:
COPTIMIZE = -O3 -funroll-all-loops
CFLAGS =
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

183.equake=base=default=default:
COPTIMIZE = -O3 -funroll-all-loops
CFLAGS =
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

188.ammp=base=default=default:
COPTIMIZE = -O3 -funroll-all-loops
CFLAGS=
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
# Delete feedback data from previous runs
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

################################################################
# Peak Tuning Flags
################################################################
#
# int2000
# Peak tuning
#
164.gzip=peak=default=default:
notes0088= 164.gzip: -O3 -funroll-all-loops -finline-limit=900 -freduce-all-givs +FDO
COPTIMIZE = -O3 -funroll-all-loops -finline-limit=900 -freduce-all-givs
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

175.vpr=peak=default=default:
notes0090= 175.vpr: -O3 -funroll-loops -finline-limit=1000 +FDO
COPTIMIZE = -O3 -funroll-loops -finline-limit=1000
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

176.gcc=peak=default=default:
notes0100= 176.gcc: -O3 -funroll-all-loops -finline-limit=900 +FDO
COPTIMIZE = -O3 -funroll-all-loops -finline-limit=900
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

181.mcf=peak=default=default:
notes0110= 181.mcf: -O3 -funroll-all-loops -m32 +FDO
# PORTABILITY is emptied here because this peak build uses -m32.
PORTABILITY=
COPTIMIZE = -O3 -funroll-all-loops -m32
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

186.crafty=peak=default=default:
notes0120= 186.crafty: -O3 -funroll-loops -fprefetch-loop-arrays
COPTIMIZE = -O3 -funroll-loops -fprefetch-loop-arrays

197.parser=peak=default=default:
notes0130= 197.parser: -O3 -funroll-all-loops -m32 +FDO
# PORTABILITY is emptied here because this peak build uses -m32.
PORTABILITY=
COPTIMIZE = -O3 -funroll-all-loops -m32
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

252.eon=peak=default=default:
notes0140= 252.eon: -O3 -funroll-all-loops -ffast-math -finline-limit=3000 +FDO
CXXOPTIMIZE = -O3 -funroll-all-loops -ffast-math -finline-limit=3000
PASS1_CXXFLAGS = -fprofile-arcs
PASS2_CXXFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CXXFLAGS)
PASS2_LDFLAGS = $(PASS2_CXXFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

253.perlbmk=peak=default=default:
notes0150= 253.perlbmk: -O3 -funroll-all-loops -finline-limit=1800 +FDO
COPTIMIZE = -O3 -funroll-all-loops -finline-limit=1800
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

254.gap=peak=default=default:
notes0160= 254.gap: basepeak=true
basepeak = true

255.vortex=peak=default=default:
notes0170= 255.vortex: -O3 -funroll-all-loops -finline-limit=1000 +FDO
COPTIMIZE = -O3 -funroll-all-loops -finline-limit=1000
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

256.bzip2=peak=default=default:
notes0180= 256.bzip2: -O3 -funroll-all-loops -freduce-all-givs -finline-limit=2700 +FDO
COPTIMIZE = -O3 -funroll-all-loops -freduce-all-givs -finline-limit=2700
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)
fdo_pre0 = rm -f *.da *.life analyz_prbrob.out

300.twolf=peak=default=default:
notes0190= 300.twolf: -O3 -funroll-all-loops -finline-limit=2000 -m32 +FDO
# PORTABILITY is emptied here because this peak build uses -m32.
PORTABILITY=
COPTIMIZE = -O3 -funroll-all-loops -finline-limit=2000 -m32
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)

#################################################
# fp2000
# Peak tuning
#################################################
168.wupwise=peak=default=default:
#Use PGI 5.1 Fortran
notes0090= 168.wupwise: pgf90 -fastsse -Mipa=fast -Minline=levels:2
PASS1_F77FLAGS = -fastsse -Mipa=fast -Minline=levels:2
PASS2_F77FLAGS = -fastsse -Mipa=fast -Minline=levels:2
# Each pass links with the same flags it compiles with.
PASS1_LDF77FLAGS= $(PASS1_F77FLAGS)
PASS2_LDF77FLAGS= $(PASS2_F77FLAGS)
ONESTEP = yes

171.swim=peak=default=default:
#Use PGI 5.1 Fortran
notes0100= 171.swim: basepeak=true
basepeak = true

172.mgrid=peak=default=default:
#Use PGI 5.1 Fortran
notes0110= 172.mgrid: pgf90 -fast -Mipa=fast
PASS1_F77FLAGS = -fast -Mipa=fast
PASS2_F77FLAGS = -fast -Mipa=fast
# Each pass links with the same flags it compiles with.
PASS1_LDF77FLAGS= $(PASS1_F77FLAGS)
PASS2_LDF77FLAGS= $(PASS2_F77FLAGS)
ONESTEP = yes

173.applu=peak=default=default:
#Use PGI 5.1 Fortran
notes0120= 173.applu: pgf90 -fast -Mipa=fast
PASS1_F77FLAGS = -fast -Mipa=fast
PASS2_F77FLAGS = -fast -Mipa=fast
# Each pass links with the same flags it compiles with.
PASS1_LDF77FLAGS= $(PASS1_F77FLAGS)
PASS2_LDF77FLAGS= $(PASS2_F77FLAGS)
ONESTEP = yes

177.mesa=peak=default=default:
#Use SuSE gcc33
notes0130= 177.mesa: gcc -O3 -funroll-all-loops -finline-limit=2000 +FDO
CPORTABILITY = -DSPEC_CPU2000_LP64
COPTIMIZE = -O3 -finline-limit=2000 -funroll-all-loops
CFLAGS =
ONESTEP = yes
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)

178.galgel=peak=default=default:
#Use PGI 5.1 Fortran
notes0140= 178.galgel: pgf90 -fastsse -O3 -mp RM_SOURCES=lapak.f90 +ACML
FFLAGS = -fastsse -O3 -mp
RM_SOURCES = lapak.f90
EXTRA_LIBS = -lacml
ONESTEP = yes

179.art=peak=default=default:
#Use SuSE gcc33
notes0150= 179.art: gcc -O3 -funroll-all-loops -ffast-math -finline-limit=1500 +FDO
CPORTABILITY = -DSPEC_CPU2000_LP64
COPTIMIZE = -O3 -funroll-all-loops -ffast-math -finline-limit=1500
CFLAGS =
ONESTEP = yes
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)

183.equake=peak=default=default:
#Use SuSE gcc33
notes0160= 183.equake: gcc -O3 -funroll-all-loops -ffast-math -finline-limit=2000
CPORTABILITY = -DSPEC_CPU2000_LP64
COPTIMIZE = -O3 -funroll-all-loops -ffast-math -finline-limit=2000
CFLAGS =
ONESTEP = yes

187.facerec=peak=default=default:
#Use PGI 5.1 Fortran
notes0170= 187.facerec: basepeak=true
basepeak = true

188.ammp=peak=default=default:
#Use SuSE gcc33
notes0180= 188.ammp: gcc -O3 -funroll-all-loops -ffast-math -finline-limit=2000 +FDO
CPORTABILITY = -DSPEC_CPU2000_LP64
COPTIMIZE = -O3 -funroll-all-loops -ffast-math -finline-limit=2000
CFLAGS =
ONESTEP = yes
PASS1_CFLAGS = -fprofile-arcs
PASS2_CFLAGS = -fbranch-probabilities
PASS1_LDFLAGS = $(PASS1_CFLAGS)
PASS2_LDFLAGS = $(PASS2_CFLAGS)

189.lucas=peak=default=default:
#Use PGI 5.1 Fortran
notes0190= 189.lucas: pgf90 -fastsse -Mipa=fast -Mnosmart
PASS1_FFLAGS = -fastsse -Mipa=fast -Mnosmart
PASS2_FFLAGS = -fastsse -Mipa=fast -Mnosmart
ONESTEP = yes

191.fma3d=peak=default=default:
#Use PGI 5.1 Fortran
notes0200= 191.fma3d: basepeak=true
basepeak = true

200.sixtrack=peak=default=default:
#Use PGI 5.1 Fortran
notes0210= 200.sixtrack: basepeak=true
basepeak = true

301.apsi=peak=default=default:
#Use PGI 5.1 Fortran
notes0220= 301.apsi: basepeak=true
basepeak = true

int=default=default=default:
notes0025= +FDO: PASS1=-fprofile-arcs PASS2=-fbranch-probabilities
notes0030= Portability:
notes0086= Peak tuning:
notes0230= ONESTEP is used for all base and peak runs
sw_avail= Dec-2003
sw_compiler0000= SuSE optional gcc 3.3 compiler (20030312) (from SLES8 SP3)

fp=default=default=default:
notes0010= +FDO: PASS1=-fprofile-arcs PASS2=-fbranch-probabilities
notes0015= +ACML is linking with AMD Core Math Library
notes0020= pgf90 is the PGI Fortran compiler
notes0025= gcc is the SuSE optional gcc 3.3 compiler (from SLES8 SP3)
notes0040= Portability:
notes0088= Peak tuning:
notes0260= ONESTEP is used for all base and peak runs
sw_avail= Jan-2004
sw_compiler0000= PGI Fortran 5.1-3 and SuSE gcc33 optional compiler (from SLES8 SP3)
sw_compiler0010= AMD Core Math Library (Version 1.5) for AMD64