Commit 669989b0 authored by Youngsung Kim's avatar Youngsung Kim
Browse files

saving work

parent 5bef05f3
include Makefile.inc
# Makefile for KGEN-generated kernel
# Originally used compiler(s)
#FC_0 := /sw/summit/xl/16.1.1-5/xlf/16.1.1/bin/.orig/xlf2008_r
FC_0 := /sw/summit/gcc/6.4.0/bin/gfortran
#FC_0 := mpif90
#FC_FLAGS_SET_0 := -F/sw/summit/xl/16.1.1-5/xlf/16.1.1/etc/xlf.cfg.rhel.7.6.gcc.4.8.5.cuda.10.1 -g -qfullpath -qmaxmem=-1 -qphsinfo -qzerosize -qfree=f90 -qxlf2003=polymorphic -qspillsize=2500 -qextname=flush -qsuffix=f=f90:cpp=F90 -g -O2 -qoffload -qthreaded -D_MPI
#FC_FLAGS_SET_0 := -F/sw/summit/xl/16.1.1-5/xlf/16.1.1/etc/xlf.cfg.rhel.7.6.gcc.4.8.5.cuda.10.1 -g -qfullpath -qmaxmem=-1 -qphsinfo -qzerosize -qfree=f90 -qxlf2003=polymorphic -qspillsize=2500 -qextname=flush -qsuffix=f=f90:cpp=F90 -g -O2 -qoffload -qthreaded
FC_FLAGS_SET_0 := -ffree-form -ffree-line-length-none -O3 -g -I $(EXTRAE_HOME)/include
#CC_0 := /sw/summit/xl/16.1.1-5/xlC/16.1.1/bin/xlc_r
CC_0 := /sw/summit/gcc/6.4.0/bin/gcc
CC_FLAGS_SET_0 := -O3 -g -I $(EXTRAE_HOME)/include
LFLAGS = -Wl,-rpath -Wl,$(EXTRAE_HOME)/lib -L$(EXTRAE_HOME)/lib -lseqtrace
ALL_OBJS := crm_module.o vars.o grid.o domain.o crmdims.o sgs.o scalar_momentum.o params.o microphysics.o cloud.o precip_init.o task_util_NOMPI.o precip_proc.o micro_params.o damping.o crm_output_module.o kurant.o abcoefs.o buoyancy.o crm_surface.o zero.o forcing.o ice_fall.o shr_const_mod.o shr_kind_mod.o boundaries.o periodic.o bound_exchange.o advection.o tke_full.o shear_prod3D.o shear_prod2D.o sat.o advect_mom.o advect2_mom_z.o advect2_mom_xy.o diffuse_mom.o diffuse_mom2D.o diffuse_mom3D.o diagnose.o uvw.o coriolis.o pressure.o fft.o press_rhs.o bound_duvdt.o press_grad.o adams.o advect_all_scalars.o advect_scalar.o advect_scalar2D.o advect_scalar3D.o diffuse_scalar.o diffuse_scalar3D.o diffuse_scalar2D.o accelerate_crm.o kernel_driver.o kgen_utils.o tprof_mod.o gammafff.o
build: ${ALL_OBJS}
${FC_0} ${FC_FLAGS_SET_0} ${LFLAGS} -o kernel.exe $^
PRERUN := source /sw/summit/extrae/3.7.1/rhel7.5_gnu6.4.0/etc/extrae.sh; export EXTRAE_CONFIG_FILE=extrae.xml;
# export EXECUTABLE=./pi_instrumentedf # This is taken by extrae.xml
#${EXECUTABLE}
run: build
#mpirun -np 2 ./kernel.exe
${PRERUN}./kernel.exe
crm_module.o: crm_module.F90 vars.o grid.o domain.o crmdims.o sgs.o scalar_momentum.o params.o microphysics.o cloud.o precip_init.o task_util_NOMPI.o precip_proc.o micro_params.o damping.o crm_output_module.o kurant.o abcoefs.o buoyancy.o crm_surface.o zero.o forcing.o ice_fall.o shr_const_mod.o shr_kind_mod.o boundaries.o periodic.o bound_exchange.o advection.o tke_full.o shear_prod3D.o shear_prod2D.o sat.o advect_mom.o advect2_mom_z.o advect2_mom_xy.o diffuse_mom.o diffuse_mom2D.o diffuse_mom3D.o diagnose.o uvw.o coriolis.o pressure.o fft.o press_rhs.o bound_duvdt.o press_grad.o adams.o advect_all_scalars.o advect_scalar.o advect_scalar2D.o advect_scalar3D.o diffuse_scalar.o diffuse_scalar3D.o diffuse_scalar2D.o accelerate_crm.o kgen_utils.o tprof_mod.o
$(FC_0) ${FC_FLAGS_SET_0} -c -o $@ $(EXTRAE_HOME)/include/extrae_module.f90
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
vars.o: vars.F90 kgen_utils.o tprof_mod.o grid.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
grid.o: grid.F90 kgen_utils.o tprof_mod.o domain.o params.o advection.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
domain.o: domain.F90 kgen_utils.o tprof_mod.o crmdims.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
crmdims.o: crmdims.F90 kgen_utils.o tprof_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
sgs.o: sgs.F90 kgen_utils.o tprof_mod.o params.o grid.o tke_full.o vars.o diffuse_mom.o diffuse_scalar.o microphysics.o scalar_momentum.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
scalar_momentum.o: scalar_momentum.F90 kgen_utils.o tprof_mod.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
params.o: params.F90 kgen_utils.o tprof_mod.o shr_const_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
microphysics.o: microphysics.F90 kgen_utils.o tprof_mod.o params.o vars.o micro_params.o grid.o precip_init.o cloud.o precip_proc.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
cloud.o: cloud.F90 kgen_utils.o tprof_mod.o micro_params.o vars.o params.o sat.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
precip_init.o: precip_init.F90 kgen_utils.o tprof_mod.o micro_params.o vars.o task_util_NOMPI.o sat.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
task_util_NOMPI.o: task_util_NOMPI.F90 kgen_utils.o tprof_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
precip_proc.o: precip_proc.F90 kgen_utils.o tprof_mod.o micro_params.o vars.o sat.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
micro_params.o: micro_params.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
damping.o: damping.F90 kgen_utils.o tprof_mod.o params.o vars.o task_util_NOMPI.o microphysics.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
crm_output_module.o: crm_output_module.F90 kgen_utils.o tprof_mod.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
kurant.o: kurant.F90 kgen_utils.o tprof_mod.o params.o vars.o sgs.o task_util_NOMPI.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
abcoefs.o: abcoefs.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
buoyancy.o: buoyancy.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
crm_surface.o: crm_surface.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
zero.o: zero.F90 kgen_utils.o tprof_mod.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
forcing.o: forcing.F90 kgen_utils.o tprof_mod.o params.o vars.o microphysics.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
ice_fall.o: ice_fall.F90 kgen_utils.o tprof_mod.o params.o vars.o microphysics.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
shr_const_mod.o: shr_const_mod.F90 kgen_utils.o tprof_mod.o shr_kind_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
shr_kind_mod.o: shr_kind_mod.F90 kgen_utils.o tprof_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
boundaries.o: boundaries.F90 kgen_utils.o tprof_mod.o periodic.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
periodic.o: periodic.F90 kgen_utils.o tprof_mod.o bound_exchange.o vars.o sgs.o params.o microphysics.o scalar_momentum.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
bound_exchange.o: bound_exchange.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advection.o: advection.F90 kgen_utils.o tprof_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
tke_full.o: tke_full.F90 kgen_utils.o tprof_mod.o params.o vars.o shear_prod3D.o shear_prod2D.o sat.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
shear_prod3D.o: shear_prod3D.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
shear_prod2D.o: shear_prod2D.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
sat.o: sat.F90 kgen_utils.o tprof_mod.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect_mom.o: advect_mom.F90 kgen_utils.o tprof_mod.o advect2_mom_xy.o advect2_mom_z.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect2_mom_z.o: advect2_mom_z.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect2_mom_xy.o: advect2_mom_xy.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_mom.o: diffuse_mom.F90 kgen_utils.o tprof_mod.o vars.o diffuse_mom3D.o diffuse_mom2D.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_mom2D.o: diffuse_mom2D.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_mom3D.o: diffuse_mom3D.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diagnose.o: diagnose.F90 kgen_utils.o tprof_mod.o params.o vars.o sat.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
uvw.o: uvw.F90 kgen_utils.o tprof_mod.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
coriolis.o: coriolis.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
pressure.o: pressure.F90 kgen_utils.o tprof_mod.o vars.o params.o press_rhs.o fft.o press_grad.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
fft.o: fft.F90 kgen_utils.o tprof_mod.o params.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
press_rhs.o: press_rhs.F90 kgen_utils.o tprof_mod.o params.o vars.o bound_duvdt.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
bound_duvdt.o: bound_duvdt.F90 kgen_utils.o tprof_mod.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
press_grad.o: press_grad.F90 kgen_utils.o tprof_mod.o vars.o params.o bound_duvdt.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
adams.o: adams.F90 kgen_utils.o tprof_mod.o params.o vars.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect_all_scalars.o: advect_all_scalars.F90 kgen_utils.o tprof_mod.o vars.o advect_scalar.o microphysics.o scalar_momentum.o sgs.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect_scalar.o: advect_scalar.F90 kgen_utils.o tprof_mod.o params.o grid.o advect_scalar3D.o vars.o advect_scalar2D.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect_scalar2D.o: advect_scalar2D.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
advect_scalar3D.o: advect_scalar3D.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_scalar.o: diffuse_scalar.F90 kgen_utils.o tprof_mod.o params.o grid.o diffuse_scalar3D.o vars.o diffuse_scalar2D.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_scalar3D.o: diffuse_scalar3D.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
diffuse_scalar2D.o: diffuse_scalar2D.F90 kgen_utils.o tprof_mod.o params.o grid.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
accelerate_crm.o: accelerate_crm.F90 kgen_utils.o tprof_mod.o params.o shr_kind_mod.o grid.o vars.o microphysics.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
kernel_driver.o: kernel_driver.F90 crm_module.o vars.o grid.o domain.o crmdims.o sgs.o scalar_momentum.o params.o microphysics.o cloud.o precip_init.o task_util_NOMPI.o precip_proc.o micro_params.o damping.o crm_output_module.o kurant.o abcoefs.o buoyancy.o crm_surface.o zero.o forcing.o ice_fall.o shr_const_mod.o shr_kind_mod.o boundaries.o periodic.o bound_exchange.o advection.o tke_full.o shear_prod3D.o shear_prod2D.o sat.o advect_mom.o advect2_mom_z.o advect2_mom_xy.o diffuse_mom.o diffuse_mom2D.o diffuse_mom3D.o diagnose.o uvw.o coriolis.o pressure.o fft.o press_rhs.o bound_duvdt.o press_grad.o adams.o advect_all_scalars.o advect_scalar.o advect_scalar2D.o advect_scalar3D.o diffuse_scalar.o diffuse_scalar3D.o diffuse_scalar2D.o accelerate_crm.o kgen_utils.o tprof_mod.o
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
kgen_utils.o: kgen_utils.f90
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
tprof_mod.o: tprof_mod.f90
${FC_0} ${FC_FLAGS_SET_0} -c -o $@ $<
gammafff.o: gammafff.c
${CC_0} ${CC_FLAGS_SET_0} -c -o $@ $<
clean:
rm -fr kernel.exe *.mod ${ALL_OBJS} TRACE*.mpit* TRACE.sym set-0
# This file is automatically generated after the make install step.
EXTRAE_HOME=/sw/summit/extrae/3.7.1/rhel7.5_gnu6.4.0
MPI_HOME=/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi
MPI_CFLAGS=-I/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/include
MPI_LDFLAGS=-L/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/lib
MPI_LIBS=-lmpi_ibm
PAPI_HOME=/autofs/nccs-svm1_sw/summit/.swci/0-core/opt/spack/20180914/linux-rhel7-ppc64le/gcc-4.8.5/papi-5.6.0-xhd3soyh4mzxlhqmtinhylnchxuqkshb/
XML2_HOME= /usr
XML2_LDFLAGS=-L/usr/lib64
XML2_LIBS=-lxml2
UNWIND_HOME=/sw/summit/scorep/libunwind-1.3.1/rhel7.5_gnu6.4.0/
BFD_HOME=/usr
LIBERTY_HOME=/usr
BFD_LIBS=-L/usr/lib64 -lbfd -L/usr/lib64 -liberty
UNWIND_LIBS=-L$(UNWIND_HOME)/lib -lunwind
PAPI_LIBS=-L$(PAPI_HOME)/lib -lpapi
CUPTI_LIBS=
POSIX_CLOCK_LIBS=
LIBEXECINFO_LIBS= # FreeBSD specific
ZLIB_HOME=/usr
ZLIB_LIBS=-lz
DL_LIBS=-ldl
OPENCL_HOME=
OPENCL_LDFLAGS=
CC=/sw/summit/gcc/6.4.0/bin/gcc
FC=/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/bin/mpif90
CXX=/sw/summit/gcc/6.4.0/bin/g++
MPICC=/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/bin/mpicc
MPIF77=/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/bin/mpif77
MPIF90=/autofs/nccs-svm1_sw/summit/.swci/1-compute/opt/spack/20180914/linux-rhel7-ppc64le/gcc-8.1.1/spectrum-mpi-10.3.0.0-20190419-juwhiawazufuuoastohlsuewaklwmazi/bin/mpif90
NVCC=/sw/summit/cuda/10.1.105/bin/nvcc
JAVAC=
JAR=
# For statically linked apps or systems
EXTRAE_LDFLAGS_LIBSEQTRACE=-L$(EXTRAE_HOME)/lib -lseqtrace -L$(ZLIB_HOME)/lib -lz -L$(PAPI_HOME)/lib -lpapi -L$(XML2_HOME)/lib -lxml2 -L$(BFD_HOME)/lib -lbfd -liberty
EXTRAE_LDFLAGS_LIBMPITRACE=-L$(EXTRAE_HOME)/lib -lmpitrace -L$(ZLIB_HOME)/lib -lz -L$(PAPI_HOME)/lib -lpapi -L$(XML2_HOME)/lib -lxml2 -L$(BFD_HOME)/lib -lbfd -liberty
EXTRAE_LDFLAGS_LIBMPITRACEF=-L$(EXTRAE_HOME)/lib -lmpitracef -L$(ZLIB_HOME)/lib -lz -L$(PAPI_HOME)/lib -lpapi -L$(XML2_HOME)/lib -lxml2 -L$(BFD_HOME)/lib -lbfd -liberty
......@@ -41,6 +41,9 @@ contains
SUBROUTINE crm(kgen_unit, kgen_measure, kgen_isverified, kgen_filepath, ncrms, plev)
!-----------------------------------------------------------------------------------------------
!-----------------------------------------------------------------------------------------------
USE EXTRAE_MODULE
USE shr_kind_mod, ONLY: r8 => shr_kind_r8
USE vars
USE microphysics
......@@ -126,7 +129,7 @@ SUBROUTINE crm(kgen_unit, kgen_measure, kgen_isverified, kgen_filepath, ncrms, p
INTEGER :: kgen_mpirank, kgen_openmptid, kgen_kernelinvoke
LOGICAL :: kgen_evalstage, kgen_warmupstage, kgen_mainstage
COMMON / state / kgen_mpirank, kgen_openmptid, kgen_kernelinvoke, kgen_evalstage, kgen_warmupstage, kgen_mainstage
INTEGER, PARAMETER :: KGEN_MAXITER = 10
INTEGER, PARAMETER :: KGEN_MAXITER = 100
TYPE(check_t) :: check_status
INTEGER*8 :: kgen_start_clock, kgen_stop_clock, kgen_rate_clock
......@@ -758,6 +761,8 @@ SUBROUTINE crm(kgen_unit, kgen_measure, kgen_isverified, kgen_filepath, ncrms, p
CALL SYSTEM_CLOCK(kgen_start_clock, kgen_rate_clock)
DO kgen_intvar = 1, KGEN_MAXITER
call extrae_user_function(1)
nstep = nstep + 1
!$omp target teams distribute parallel do
do icrm = 1 , ncrms
......@@ -1075,6 +1080,10 @@ SUBROUTINE crm(kgen_unit, kgen_measure, kgen_isverified, kgen_filepath, ncrms, p
enddo
enddo
END DO
call extrae_user_function(0)
call extrae_next_hwc_set()
CALL SYSTEM_CLOCK(kgen_stop_clock, kgen_rate_clock)
kgen_measure = 1.0D6*(kgen_stop_clock - kgen_start_clock)/DBLE(kgen_rate_clock*KGEN_MAXITER)
#ifdef _MPI
......
This diff is collapsed.
This diff is collapsed.
<?xml version='1.0'?>
<trace enabled="yes"
home="/sw/summit/extrae/3.7.1/rhel7.5_gnu8.1.1"
initial-mode="detail"
type="paraver"
>
<user-functions enabled="no" list="function-list" exclude-automatic-functions="no">
<counters enabled="yes" />
</user-functions>
<counters enabled="yes">
<cpu enabled="yes" starting-set-distribution="0">
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_L2_DCM
</set>
<!--
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_L1_DCM,PAPI_L2_DCM,PAPI_L3_TCM,PAPI_BR_INS,PAPI_BR_MSP,RESOURCE_STALLS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_VEC_SP,PAPI_SR_INS,PAPI_LD_INS,PAPI_FP_INS
<sampling enabled="no" period="1000000000">PAPI_TOT_CYC</sampling>
</set>
-->
<!--
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_FP_INS,PAPI_TOT_CYC,PAPI_FP_OPS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_IIS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_INT_INS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SR_INS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_DCR
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L1_ICH
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_ICH
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SP_OPS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_DP_OPS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_FP_INS,PAPI_TOT_CYC,PAPI_FP_OPS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_IIS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_INT_INS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SR_INS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_DCR
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L1_ICH
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_ICH
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SP_OPS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_DP_OPS
</set>
-->
</cpu>
<network enabled="no" />
<resource-usage enabled="no" />
<memory-usage enabled="no" />
</counters>
<storage enabled="no">
<trace-prefix enabled="yes">TRACE</trace-prefix>
<size enabled="no">5</size>
<temporal-directory enabled="yes">/scratch</temporal-directory>
<final-directory enabled="yes">/gpfs/scratch/bsc41/bsc41273</final-directory>
</storage>
<buffer enabled="yes">
<size enabled="yes">5000000</size>
<circular enabled="no" />
</buffer>
<trace-control enabled="yes">
<file enabled="no" frequency="5M">/gpfs/scratch/bsc41/bsc41273/control</file>
<global-ops enabled="no"></global-ops>
</trace-control>
<others enabled="yes">
<minimum-time enabled="no">10M</minimum-time>
<finalize-on-signal enabled="yes"
SIGUSR1="no" SIGUSR2="no" SIGINT="yes"
SIGQUIT="yes" SIGTERM="yes" SIGXCPU="yes"
SIGFPE="yes" SIGSEGV="yes" SIGABRT="yes"
/>
<flush-sampling-buffer-at-instrumentation-point enabled="yes" />
</others>
<sampling enabled="yes" type="default" period="100u" variability="50u" />
<dynamic-memory enabled="no" />
<input-output enabled="no" />
<syscall enabled="no" />
<merge enabled="yes"
synchronization="default"
tree-fan-out="16"
max-memory="512"
joint-states="yes"
keep-mpits="yes"
sort-addresses="yes"
overwrite="yes"
/>
</trace>
<?xml version='1.0'?>
<trace enabled="yes"
home="/sw/summit/extrae/3.7.1/rhel7.5_gnu8.1.1"
initial-mode="detail"
type="paraver"
>
<user-functions enabled="yes" list="function-list" exclude-automatic-functions="no">
<counters enabled="yes" />
</user-functions>
<counters enabled="yes">
<cpu enabled="yes" starting-set-distribution="1">
<!--
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_L1_DCM,PAPI_L2_DCM,PAPI_L3_TCM,PAPI_BR_INS,PAPI_BR_MSP,RESOURCE_STALLS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_VEC_SP,PAPI_SR_INS,PAPI_LD_INS,PAPI_FP_INS
<sampling enabled="no" period="1000000000">PAPI_TOT_CYC</sampling>
</set>
-->
<!-- counter set 1 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_FP_INS,PAPI_TOT_CYC,PAPI_FP_OPS
</set>
<!-- counter set 2 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_IIS
</set>
<!-- counter set 3 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_INT_INS
</set>
<!-- counter set 4 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SR_INS
</set>
<!-- counter set 5 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_DCR
</set>
<!-- counter set 6 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L1_ICH
</set>
<!-- counter set 7 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_ICH
</set>
<!-- counter set 8 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SP_OPS
</set>
<!-- counter set 9 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_DP_OPS
</set>
<!-- counter set 1 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_FP_INS,PAPI_TOT_CYC,PAPI_FP_OPS
</set>
<!-- counter set 2 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_IIS
</set>
<!-- counter set 3 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_INT_INS
</set>
<!-- counter set 4 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SR_INS
</set>
<!-- counter set 5 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_DCR
</set>
<!-- counter set 6 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L1_ICH
</set>
<!-- counter set 7 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_L3_ICH
</set>
<!-- counter set 8 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_SP_OPS
</set>
<!-- counter set 9 -->
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_DP_OPS
</set>
</cpu>
<network enabled="no" />
<resource-usage enabled="no" />
<memory-usage enabled="no" />
</counters>
<storage enabled="no">
<trace-prefix enabled="yes">TRACE</trace-prefix>
<size enabled="no">5</size>
<temporal-directory enabled="yes">/scratch</temporal-directory>
<final-directory enabled="yes">/gpfs/scratch/bsc41/bsc41273</final-directory>
</storage>
<buffer enabled="yes">
<size enabled="yes">5000000</size>
<circular enabled="no" />
</buffer>
<trace-control enabled="yes">
<file enabled="no" frequency="5M">/gpfs/scratch/bsc41/bsc41273/control</file>
<global-ops enabled="no"></global-ops>
</trace-control>
<others enabled="yes">
<minimum-time enabled="no">10M</minimum-time>
<finalize-on-signal enabled="yes"
SIGUSR1="no" SIGUSR2="no" SIGINT="yes"
SIGQUIT="yes" SIGTERM="yes" SIGXCPU="yes"
SIGFPE="yes" SIGSEGV="yes" SIGABRT="yes"
/>
<flush-sampling-buffer-at-instrumentation-point enabled="yes" />
</others>
<sampling enabled="yes" type="default" period="100u" variability="50u" />
<dynamic-memory enabled="no" />
<input-output enabled="no" />
<syscall enabled="no" />
<merge enabled="yes"
synchronization="default"
tree-fan-out="16"
max-memory="512"
joint-states="yes"
keep-mpits="yes"
sort-addresses="yes"
overwrite="yes"
/>
</trace>
<?xml version='1.0'?>
<trace enabled="yes"
home="/sw/summit/extrae/3.7.1/rhel7.5_gnu8.1.1"
initial-mode="detail"
type="paraver"
>
<user-functions enabled="yes" list="function-list" exclude-automatic-functions="no">
<counters enabled="yes" />
</user-functions>
<counters enabled="yes">
<cpu enabled="yes" starting-set-distribution="1">
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_L1_DCM,PAPI_L2_DCM,PAPI_L3_TCM,PAPI_BR_INS,PAPI_BR_MSP,RESOURCE_STALLS
</set>
<set enabled="yes" domain="all" changeat-time="0">
PAPI_TOT_INS,PAPI_TOT_CYC,PAPI_VEC_SP,PAPI_SR_INS,PAPI_LD_INS,PAPI_FP_INS
<sampling enabled="no" period="1000000000">PAPI_TOT_CYC</sampling>
</set>
</cpu>
<network enabled="no" />
<resource-usage enabled="no" />