# Invocation command line:
# /cpu2000/bin/runspec -c amd384K8 -T all int
############################################################################
# pathscale-amd64.cfg
#
# Copyright 2003, 2004, 2005 PathScale, Inc.  All Rights Reserved.
#
# Configuration file for use with the PathScale compiler on x86-64

# Global options, set before any named section is opened.
# NOTE(review): presumably enables checksum verification of stored settings/binaries -- confirm in the runspec docs.
check_md5 = 1

# Extension tag identifying this compiler/configuration combination.
ext=ps_amd64_R23
# NOTE(review): by their names these echo build output and run output to the terminal -- confirm.
teeout=yes
teerunout=yes

################################################################
# Machine-specific section
################################################################
# Software availability date as set by the top-level config.
# NOTE(review): sw_avail is assigned again (Jan-2006) inside the inlined SUT.inc text
# below; presumably the later assignment wins -- confirm duplicate-key handling.
sw_avail     = Nov-2005
#include: SUT.inc
# ---- Begin inclusion of '/cpu2000/config/SUT.inc'
################################################################
# Machine-specific section
################################################################
# Descriptive fields for the system under test (hardware first, then software).
hw_cpu       = AMD Opteron (TM) 256
hw_cpu_mhz   = 3000
hw_disk      = SATA, 250 GB
hw_fpu       = Integrated
hw_memory    = 2x512MB, DDR400 CL2 ECC Reg
hw_vendor    = Advanced Micro Devices
hw_model     = TYAN Thunder K8SD Pro (S2882-D), Opteron (TM) 256
hw_avail     = Apr-2006
sw_avail     = Jan-2006
hw_ncpu      = 1 cores, 1 chips, 1 core/chip
hw_ncpuorder = 1-2
hw_ocache    = N/A
hw_other     = None
hw_parallel  = No
hw_pcache    = 64KBI + 64KBD on chip
hw_scache    = 1024KB (I+D) on chip
hw_tcache    = N/A
sw_file      = Linux/ext3
sw_os        = SuSE Linux Enterprise Server 9 SP3 (64-bit)
sw_state     = Multi-user, run level 3
# Job submission wrapper: builds a one-bit hexadecimal CPU mask (1 << $SPECUSERNUM)
# and starts the benchmark command under /usr/bin/taskset with that mask.
# The backslashes defer expansion of the shell variables until the command runs.
submit= MYMASK=`printf '0x%x' \$((1<<\$SPECUSERNUM))`; /usr/bin/taskset \$MYMASK $command
# System setup notes
# To add notes, uncomment the lines below and fill in the text.
#notes6000    =
#notes6010    =
#notes6020    =
# Free-form system setup notes: memory modules, BIOS revision, chassis/power supply
# and the kernel used. notes6050 and notes6060 form one sentence split over two lines.
notes6030    = Corsair CMX512RE-3200LL (XMS3200REv2.1) memory used in Dual Channel configuration.
notes6040    = BIOS rev 3.05
notes6050    = The tested system can be assembled using a standard ATX case and an Antec True 550
notes6060    = watt EPS12V Power Supply.
notes6070    = Single-processor kernel (2.6.5-7.244-default) was used.
#notes6100    = taskset utility used to bind CPU(s) to processes.
################################################################
# Software and license-specific section
################################################################
# License, test date and tester identification (from the inlined SUT.inc).
license_num  = 49
test_date    = Mar-2006
prepared_by  = Michael Paton
company_name = Advanced Micro Devices
tester_name  = AMD Austin, TX
reportable   = 1
# ---- End inclusion of '/cpu2000/config/SUT.inc'
# Repeats the license_num already set in the inlined text above (same value).
license_num  = 49
# Compiler description, split across two numbered fields.
sw_compiler010 = PathScale EKOPath(TM) Compiler
sw_compiler020 =  Suite, Release 2.3

# Settings for every benchmark, tuning level, extension and machine.
default=default=default=default:

# Install locations. ACML_PSC64_DIR is used by the 178.galgel peak section
# (EXTRA_LIBS); PS_DIR is not referenced anywhere else in this file.
PS_DIR = /opt/pathscale/2.3/bin
ACML_PSC64_DIR = /opt/acml2.7.0/pathscale64/lib
# PathScale compiler drivers: C, Fortran 90/95, Fortran 77 (same driver) and C++.
CC=pathcc
FC=pathf95
F77=pathf95
CXX=pathCC

################################################################
# Initial Notes
################################################################

# Blank spacer line followed by the definition of the "+FDO" shorthand that the
# per-benchmark flag notes use.
notes016 = 
notes018 = +FDO: PASS1= -fb_create fbdata  PASS2= -fb_opt fbdata

################################################################
# Final Notes
################################################################

# Re-opens the default section; notes5000 is an empty trailing note.
default=default=default=default:
notes5000	=   

#################################################################
#                                                               #
#          SPECint Tuning & Notes                               #
#                                                               #
#################################################################

# Specify feedback-directed optimization for all SPECint runs.

# Two-pass feedback build for all SPECint benchmarks:
# pass 1 compiles and links with -fb_create (profile into "fbdata"),
# pass 2 compiles and links with -fb_opt (reads "fbdata").
int=default=default=default:
PASS1_CFLAGS  = -fb_create fbdata 
PASS1_CXXFLAGS  = -fb_create fbdata 
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_CXXFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Base tuning for SPECint: the same -Ofast level for C and C++.
int=base=default=default:
COPTIMIZE      = -Ofast
CXXOPTIMIZE    = -Ofast

# Report notes that restate the base flags above.
notes021 = 
notes022 = Baseline optimization flags: 
notes023 =   C programs:       -Ofast +FDO
notes024 =   C++ programs:     -Ofast +FDO

# Report notes that restate the per-benchmark portability flags set in the
# SPECint portability sections further down; keep both in sync.
notes100 = 
notes101 = Portability Flags:
notes106 =   186.crafty:  -DLINUX_i386
notes107 =   252.eon:     -DHAS_ERRLIST -DSPEC_CPU2000_LP64
notes108 =   253.perlbmk: -DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL  
notes109 =                -DSPEC_CPU2000_GLIBC22 -DSPEC_CPU2000_LP64
notes112 =   254.gap:     -DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO
notes113 =                -DSYS_HAS_CALLOC_PROTO -DSPEC_CPU2000_LP64
notes116 =   255.vortex:  -DSPEC_CPU2000_LP64

#################################################################
#                                                               #
#          SPECint Portability flags                            #
#                                                               #
#################################################################

# Per-benchmark portability defines, applied at every tuning level.
# Each entry is mirrored by a "Portability Flags" report note (notes106-notes116).
186.crafty=default=default=default:
CPORTABILITY = -DLINUX_i386 

# 252.eon is the C++ benchmark here, hence CXXPORTABILITY.
252.eon=default=default=default:
CXXPORTABILITY = -DHAS_ERRLIST -DSPEC_CPU2000_LP64

253.perlbmk=default=default=default: 
CPORTABILITY = -DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL -DSPEC_CPU2000_GLIBC22 -DSPEC_CPU2000_LP64

254.gap=default=default=default:
CPORTABILITY = -DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO -DSYS_HAS_CALLOC_PROTO -DSPEC_CPU2000_LP64

255.vortex=default=default=default:
CPORTABILITY= -DSPEC_CPU2000_LP64

# Heading for the peak flag notes that follow. These two lines sit textually
# inside the 255.vortex section opened above.
notes120 = 
notes125 = Peak Tuning:
     
# SPECint peak tuning, one section per benchmark. Each OPTIMIZE line is paired
# with notes that repeat the same flags plus "+FDO"; long flag lists are wrapped
# over several consecutively numbered notes.
164.gzip=peak=default=default:
OPTIMIZE = -O3 -ipa -WOPT:val=0 -OPT:unroll_size=0
notes205= 164.gzip:    -O3 -ipa -WOPT:val=0 -OPT:unroll_size=0 +FDO

# Built with -m32.
175.vpr=peak=default=default:
OPTIMIZE = -O3 -ipa -m32
notes208= 175.vpr:     -O3 -ipa -m32 +FDO

176.gcc=peak=default=default:
OPTIMIZE      = -O3 -IPA:plimit=10000 -LNO:opt=0 -OPT:goto=off
notes212= 176.gcc:     -O3 -IPA:plimit=10000 -LNO:opt=0 -OPT:goto=off +FDO

# Built with -m32.
181.mcf=peak=default=default:
OPTIMIZE      = -O3 -ipa -IPA:field_reorder=on -m32
notes214= 181.mcf:     -O3 -ipa -IPA:field_reorder=on -m32 +FDO

186.crafty=peak=default=default:
OPTIMIZE      = -Ofast -CG:local_fwd_sched=on -LNO:opt=0 -WOPT:val=0
notes217= 186.crafty:  -Ofast -CG:local_fwd_sched=on -LNO:opt=0 -WOPT:val=0 +FDO

# Built with -m32.
197.parser=peak=default=default:
OPTIMIZE      = -O3 -ipa -m32 -IPA:ctype=on
notes220= 197.parser:  -O3 -ipa -m32 -IPA:ctype=on +FDO

# Flags are wrapped across notes223-notes225.
252.eon=peak=default=default:
OPTIMIZE = -Ofast -CG:gcm=off:p2align_freq=1:prefetch=off -IPA:plimit=4000 -OPT:treeheight=on -TENV:X=4:frame_pointer=off -fno-exceptions -LNO:fu=10:full_unroll_outer=on -GRA:optimize_boundary=on
notes223= 252.eon:     -Ofast -CG:gcm=off:p2align_freq=1:prefetch=off -IPA:plimit=4000
notes224=              -OPT:treeheight=on -TENV:X=4:frame_pointer=off -fno-exceptions
notes225=              -LNO:fu=10:full_unroll_outer=on -GRA:optimize_boundary=on +FDO

# Flags are wrapped across notes227-notes228.
253.perlbmk=peak=default=default:
OPTIMIZE = -O2 -ipa -OPT:Ofast:transform_to_memlib=off -fno-math-errno -IPA:plimit=10000
notes227= 253.perlbmk: -O2 -ipa -OPT:Ofast:transform_to_memlib=off 
notes228=              -fno-math-errno -IPA:plimit=10000 +FDO

# 254.gap has no peak-specific flags: basepeak makes peak use the base build.
254.gap=peak=default=default:
basepeak = true
# Numbered 230 so the note sorts between 253.perlbmk (notes227/228) and
# 255.vortex (notes233/234) and does not share a note number with the
# 256.bzip2 basepeak note (notes240).
notes230= 254.gap:   basepeak = true

# Flags are wrapped across notes233-notes234.
255.vortex=peak=default=default:
OPTIMIZE = -Ofast -OPT:goto=off -CG:p2align=on -GRA:optimize_boundary=on -IPA:min_hotness=120
notes233= 255.vortex:  -Ofast -OPT:goto=off -CG:p2align=on
notes234=              -GRA:optimize_boundary=on -IPA:min_hotness=120 +FDO

# No peak-specific flags: basepeak is set instead of an OPTIMIZE line.
256.bzip2=peak=default=default:
basepeak = true
notes240= 256.bzip2:   basepeak = true

# Built with -m32; flags are wrapped across notes245-notes247.
300.twolf=peak=default=default:
OPTIMIZE      = -O2 -CG:gcm=off:p2align_freq=100000 -OPT:Ofast:unroll_times_max=8:unroll_size=256:alias=disjoint -WOPT:mem_opnds=on -m32
notes245= 300.twolf:   -O2 -CG:gcm=off:p2align_freq=100000
notes246=              -OPT:Ofast:unroll_times_max=8:unroll_size=256:alias=disjoint
notes247=              -WOPT:mem_opnds=on -m32 +FDO

#################################################################
#                                                               #
#                        SPECfp Tuning                          #
#                                                               #
#################################################################

# Specify feedback-directed optimization for all SPECfp C codes.

# Defaults for all SPECfp benchmarks: optimization level per language plus the
# two-pass feedback flags (-fb_create in pass 1, -fb_opt in pass 2) for C,
# Fortran 90 (F*), Fortran 77 (F77*) and the link step.
# Peak sections further down override COPTIMIZE / FOPTIMIZE / F77OPTIMIZE per benchmark.
fp=default=default=default:
COPTIMIZE         = -Ofast -WOPT:mem_opnds=on
PASS1_CFLAGS      = -fb_create fbdata
PASS2_CFLAGS      = -fb_opt fbdata
FOPTIMIZE         = -Ofast -LNO:fusion=2 -OPT:fast_complex=on
F77OPTIMIZE       = -Ofast -LNO:fusion=2 -OPT:fast_complex=on
PASS1_FFLAGS      = -fb_create fbdata
PASS2_FFLAGS      = -fb_opt fbdata
PASS1_F77FLAGS      = -fb_create fbdata
PASS2_F77FLAGS      = -fb_opt fbdata
PASS1_LDFLAGS    = -fb_create fbdata
PASS2_LDFLAGS    = -fb_opt fbdata

# Definition of the "+ACML" shorthand used in the 178.galgel peak note.
notes020 = +ACML  means -L<acml2.7.0-install-dir>/pathscale64/lib -lacml, 
notes021 =        which causes linking with AMD Core Math Library V2.7.0
notes028 = 
# Report notes restating the base flags set above.
notes030 = Baseline optimization 
notes032 =   C programs:       -Ofast -WOPT:mem_opnds=on +FDO 
notes034 =   Fortran programs: -Ofast -LNO:fusion=2 -OPT:fast_complex=on +FDO
# Report notes restating the 178.galgel portability flag.
notes101       = Portability Flags:
notes102       =   178.galgel: -fixedform

# Portability flag for 178.galgel at every tuning level (mirrored by notes102).
178.galgel=default=default=default:
FPORTABILITY=-fixedform

# Heading for the SPECfp peak flag notes that follow. These two lines sit
# textually inside the 178.galgel section opened above.
notes150 =  
notes155 =Peak Tuning:

# SPECfp peak tuning for three Fortran 77 benchmarks. All three set feedback = 0
# and their notes carry no "+FDO".
# NOTE(review): feedback = 0 presumably disables the PASS1/PASS2 feedback build
# for the benchmark -- confirm in the runspec docs.
# Flags are wrapped across notes204-notes207.
168.wupwise=peak=default=default:
F77OPTIMIZE = -Ofast -LNO:prefetch_ahead=5:prefetch=3 -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3 -IPA:linear=on:plimit=50000:callee_limit=5000 -INLINE:aggressive=on
feedback = 0 
notes204= 168.wupwise:  -Ofast -LNO:prefetch_ahead=5:prefetch=3
notes205=               -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3
notes206=               -IPA:linear=on:plimit=50000:callee_limit=5000 
notes207=               -INLINE:aggressive=on

171.swim=peak=default=default:
F77OPTIMIZE     = -Ofast -CG:local_fwd_sched=on -LNO:fusion=2 -m3dnow
feedback = 0
notes210= 171.swim:     -Ofast -CG:local_fwd_sched=on -LNO:fusion=2 -m3dnow

# Flags are wrapped across notes215-notes217.
172.mgrid=peak=default=default:
F77OPTIMIZE = -Ofast -CG:gcm=off -OPT:IEEE_arith=3:unroll_size=200 -LNO:fusion=2:fission=1:blocking=off:prefetch_ahead=2 -WOPT:mem_opnds=on:aggstr=0
feedback = 0
notes215= 172.mgrid:    -Ofast -CG:gcm=off -OPT:IEEE_arith=3:unroll_size=200
notes216=               -LNO:fusion=2:fission=1:blocking=off:prefetch_ahead=2
notes217=               -WOPT:mem_opnds=on:aggstr=0

# Peak tuning with feedback left at the suite default; the notes carry "+FDO".
# Flags are wrapped across notes220-notes221.
173.applu=peak=default=default:
F77OPTIMIZE = -Ofast -CG:local_fwd_sched=on -OPT:ro=3 -TENV:X=3 -LNO:fusion=2:fission=2:full_unroll_size=10000
notes220= 173.applu:    -Ofast -CG:local_fwd_sched=on -OPT:ro=3 -TENV:X=3
notes221=               -LNO:fusion=2:fission=2:full_unroll_size=10000 +FDO

# C benchmark: overrides COPTIMIZE.
177.mesa=peak=default=default:
COPTIMIZE = -O2 -ipa -OPT:Ofast -fno-math-errno -CG:local_fwd_sched=on -WOPT:mem_opnds=on
notes225= 177.mesa:     -O2 -ipa -OPT:Ofast -fno-math-errno -CG:local_fwd_sched=on -WOPT:mem_opnds=on +FDO

# Removes lapak.f90 from the source list and links the ACML library from
# ACML_PSC64_DIR instead; the note abbreviates the link flags as "+ACML".
178.galgel=peak=default=default:
FOPTIMIZE = -Ofast -OPT:fast_complex=on
RM_SOURCES      = lapak.f90
EXTRA_LIBS      = -L$(ACML_PSC64_DIR) -lacml
notes230= 178.galgel:   -Ofast -OPT:fast_complex=on +ACML +FDO
notes232=                RM_SOURCES=lapak.f90

# C benchmark built with -m32; feedback = 0 is set and the note carries no "+FDO".
179.art=peak=default=default:
COPTIMIZE= -O3 -OPT:Ofast -fno-math-errno -mno-sse2 -m32
feedback = 0
notes235= 179.art:      -O3 -OPT:Ofast -fno-math-errno -mno-sse2 -m32

# C benchmark built with -m32; feedback left at the suite default ("+FDO" in the note).
183.equake=peak=default=default:
COPTIMIZE = -Ofast -CG:load_exe=2 -WOPT:mem_opnds=on -m32
notes240= 183.equake:   -Ofast -CG:load_exe=2 -WOPT:mem_opnds=on -m32 +FDO
     
# Overrides FOPTIMIZE; flags are wrapped across notes245-notes246.
187.facerec=peak=default=default:
FOPTIMIZE = -Ofast -LNO:fusion=2 -OPT:fast_complex=on:IEEE_NaN_Inf=off:unroll_size=0
notes245= 187.facerec:  -Ofast -LNO:fusion=2
notes246=               -OPT:fast_complex=on:IEEE_NaN_Inf=off:unroll_size=0 +FDO

# Overrides COPTIMIZE; flags are wrapped across notes250-notes251.
188.ammp=peak=default=default:
COPTIMIZE = -O3 -OPT:alias=disjoint:unroll_times_max=8:Ofast:ro=3 -fno-math-errno -TENV:X=4
notes250= 188.ammp:     -O3 -OPT:alias=disjoint:unroll_times_max=8:Ofast:ro=3
notes251=               -fno-math-errno -TENV:X=4 +FDO
     
# Overrides FOPTIMIZE; feedback left at the suite default ("+FDO" in the note).
189.lucas=peak=default=default:
FOPTIMIZE = -Ofast -OPT:ro=3:fast_nint=off:unroll_size=256 -WOPT:mem_opnds=on
notes255= 189.lucas:    -Ofast -OPT:ro=3:fast_nint=off:unroll_size=256 -WOPT:mem_opnds=on +FDO

# Flags are wrapped across notes260-notes261.
191.fma3d=peak=default=default:
FOPTIMIZE = -O2 -ipa -CG:load_exe=1 -OPT:Ofast:IEEE_arith=3:ro=3 -WOPT:mem_opnds=on:retype_expr=on -IPA:pu_reorder=1
notes260= 191.fma3d:    -O2 -ipa -CG:load_exe=1 -OPT:Ofast:IEEE_arith=3:ro=3
notes261=               -WOPT:mem_opnds=on:retype_expr=on -IPA:pu_reorder=1 +FDO 

# Overrides F77OPTIMIZE; flags are wrapped across notes265-notes266.
200.sixtrack=peak=default=default:
F77OPTIMIZE = -O3 -OPT:Ofast:Olimit=6000:early_intrinsics=on -fno-math-errno -CG:load_exe=1
notes265= 200.sixtrack: -O3 -OPT:Ofast:Olimit=6000:early_intrinsics=on
notes266=               -fno-math-errno -CG:load_exe=1 +FDO

# feedback=0 is set and the note carries no "+FDO".
301.apsi=peak=default=default:
F77OPTIMIZE = -Ofast -CG:load_exe=0 -LNO:prefetch=0:simd=2
feedback=0
notes270= 301.apsi:     -Ofast -CG:load_exe=0 -LNO:prefetch=0:simd=2