import papi-5.6.0-14.el8
This commit is contained in:
parent
010882e11e
commit
dfd9af71bc
382
SOURCES/papi-bz1908126.patch
Normal file
382
SOURCES/papi-bz1908126.patch
Normal file
@ -0,0 +1,382 @@
|
|||||||
|
commit 77ee6b54f4080ca27b7efcb4c91679d0f1e090b5
|
||||||
|
Author: Anthony Castaldo <TonyCastaldo@icl.utk.edu>
|
||||||
|
Date: Fri Jan 24 10:25:36 2020 -0500
|
||||||
|
|
||||||
|
New libpfm4 contains "aliased" pmus for backward compatibility,
|
||||||
|
amd64_fam17h == amd64_fam17h_zen1; this causes us to put BOTH pmus
|
||||||
|
into the PMUs supported string and double the events in native_avail.
|
||||||
|
This update recognizes when aliases exist (the names must be hard-coded)
|
||||||
|
and uses only one of the most recent name.
|
||||||
|
|
||||||
|
diff --git a/src/components/perf_event/pe_libpfm4_events.c b/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
index 3b5f8d13f..3262608cd 100644
|
||||||
|
--- a/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
+++ b/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
@@ -31,6 +31,9 @@
|
||||||
|
// used to step through the attributes when enumerating events
|
||||||
|
static int attr_idx;
|
||||||
|
|
||||||
|
+/* alias flags to handle amd_fam17h, amd_fam17h_zen1 both present PMUs*/
|
||||||
|
+static int amd64_fam17h_zen1_present = 0;
|
||||||
|
+
|
||||||
|
/** @class find_existing_event
|
||||||
|
* @brief looks up an event, returns it if it exists
|
||||||
|
*
|
||||||
|
@@ -482,7 +485,13 @@ static struct native_event_t *allocate_native_event(
|
||||||
|
*
|
||||||
|
* @returns returns a libpfm event number
|
||||||
|
* @retval PAPI_ENOEVENT Could not find an event
|
||||||
|
- *
|
||||||
|
+ * Operational note: _pe_libpfm4_init() must be called first to set
|
||||||
|
+ * flags for synonymous PMUs. At this writing only
|
||||||
|
+ * amd64_fam17h_zen1_present is defined.
|
||||||
|
+ * Operational note: We indirectly return the pmu_idx within the
|
||||||
|
+ * event data; the calling code uses that to set
|
||||||
|
+ * pmu_idx for subsequent calls. All we do is find
|
||||||
|
+ * the next valid pmu, if any.
|
||||||
|
*/
|
||||||
|
|
||||||
|
static int
|
||||||
|
@@ -511,6 +520,12 @@ get_first_event_next_pmu(int pmu_idx, int pmu_type)
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
+ if ((ret==PFM_SUCCESS) && amd64_fam17h_zen1_present && strcmp(pinfo.name, "amd64_fam17h") == 0) {
|
||||||
|
+ /* Skip as if invalid; we want the PMU amd64_fam17h_zen1 instead. */
|
||||||
|
+ pmu_idx++;
|
||||||
|
+ continue;
|
||||||
|
+ }
|
||||||
|
+
|
||||||
|
if ((ret==PFM_SUCCESS) && pmu_is_present_and_right_type(&pinfo,pmu_type)) {
|
||||||
|
|
||||||
|
pidx=pinfo.first_event;
|
||||||
|
@@ -1159,6 +1174,35 @@ _pe_libpfm4_init(papi_vector_t *component, int cidx,
|
||||||
|
event_table->default_pmu.size = sizeof(pfm_pmu_info_t);
|
||||||
|
retval=pfm_get_pmu_info(0, &(event_table->default_pmu));
|
||||||
|
|
||||||
|
+ SUBDBG("Prescan for aliases.")
|
||||||
|
+ /* We have to see if we have aliases in there as separate PMUs, */
|
||||||
|
+ /* we don't want both PMUs with all the events duplicated. */
|
||||||
|
+ /* For aliases, either is valid alone, but if both are present */
|
||||||
|
+ /* specify a preference in the code. */
|
||||||
|
+ /* Alias: amd64_fam17h_zen1 over amd64_fam17h. */
|
||||||
|
+ /* Alias flags are static ints global to this file. */
|
||||||
|
+ i=0;
|
||||||
|
+ while(1) {
|
||||||
|
+ memset(&pinfo,0,sizeof(pfm_pmu_info_t));
|
||||||
|
+ pinfo.size = sizeof(pfm_pmu_info_t);
|
||||||
|
+ retval=pfm_get_pmu_info(i, &pinfo);
|
||||||
|
+
|
||||||
|
+ /* We're done if we hit an invalid PMU entry */
|
||||||
|
+ /* We can't check against PFM_PMU_MAX as that might not */
|
||||||
|
+ /* match if libpfm4 is dynamically linked */
|
||||||
|
+
|
||||||
|
+ if (retval==PFM_ERR_INVAL) {
|
||||||
|
+ break;
|
||||||
|
+ }
|
||||||
|
+
|
||||||
|
+ if ( (retval==PFM_SUCCESS) && (pinfo.name != NULL) &&
|
||||||
|
+ (pmu_is_present_and_right_type(&pinfo,pmu_type)) &&
|
||||||
|
+ (strcmp(pinfo.name,"amd64_fam17h_zen1") == 0) ) {
|
||||||
|
+ amd64_fam17h_zen1_present = 1;
|
||||||
|
+ }
|
||||||
|
+ i++;
|
||||||
|
+ }
|
||||||
|
+
|
||||||
|
SUBDBG("Detected pmus:\n");
|
||||||
|
i=0;
|
||||||
|
while(1) {
|
||||||
|
@@ -1177,6 +1221,12 @@ _pe_libpfm4_init(papi_vector_t *component, int cidx,
|
||||||
|
if ((retval==PFM_SUCCESS) && (pinfo.name != NULL) &&
|
||||||
|
(pmu_is_present_and_right_type(&pinfo,pmu_type))) {
|
||||||
|
|
||||||
|
+ /* skip if it is amd64_fam17h and zen1 is also present. */
|
||||||
|
+ if (strcmp(pinfo.name,"amd64_fam17h") == 0 && amd64_fam17h_zen1_present) {
|
||||||
|
+ i++;
|
||||||
|
+ continue;
|
||||||
|
+ }
|
||||||
|
+
|
||||||
|
SUBDBG("\t%d %s %s %d\n",i,
|
||||||
|
pinfo.name,pinfo.desc,pinfo.type);
|
||||||
|
|
||||||
|
@@ -1193,11 +1243,9 @@ _pe_libpfm4_init(papi_vector_t *component, int cidx,
|
||||||
|
/* Hack to have "default core" PMU */
|
||||||
|
if ( (pinfo.type==PFM_PMU_TYPE_CORE) &&
|
||||||
|
strcmp(pinfo.name,"ix86arch")) {
|
||||||
|
-
|
||||||
|
- SUBDBG("\t %s is default\n",pinfo.name);
|
||||||
|
- memcpy(&(event_table->default_pmu),
|
||||||
|
- &pinfo,sizeof(pfm_pmu_info_t));
|
||||||
|
- found_default++;
|
||||||
|
+ memcpy(&(event_table->default_pmu),
|
||||||
|
+ &pinfo,sizeof(pfm_pmu_info_t));
|
||||||
|
+ found_default++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
commit 79fe2a025afb8acb317032030c8847c9cbfd0162
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Tue Jan 5 13:45:34 2021 +0900
|
||||||
|
|
||||||
|
Get model_string for ARM processor from pfm_get_pmu_info() function
|
||||||
|
|
||||||
|
On ARM processors, the model_string does not appear in /proc/cpuinfo.
|
||||||
|
Instead of looking at the /proc/cpuinfo information, you can look at the lscpu command information at the following URL:.
|
||||||
|
https://github.com/google/cpu_features/issues/26
|
||||||
|
http://suihkulokki.blogspot.com/2018/02/making-sense-of-proccpuinfo-on-arm.html
|
||||||
|
|
||||||
|
The libpfm4 library identifies the ARM processor type from the "CPU implement" and "CPU part" in the /proc/cpuinfo information.
|
||||||
|
The papi library can use the pfm_get_pmu_info() function from the libpfm4 library to obtain a string identifying the ARM processor type.
|
||||||
|
|
||||||
|
diff --git a/src/components/perf_event/pe_libpfm4_events.c b/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
index a84819cc0..744851ff0 100644
|
||||||
|
--- a/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
+++ b/src/components/perf_event/pe_libpfm4_events.c
|
||||||
|
@@ -1149,6 +1149,7 @@ _pe_libpfm4_init(papi_vector_t *component, int cidx,
|
||||||
|
|
||||||
|
pfm_err_t retval = PFM_SUCCESS;
|
||||||
|
pfm_pmu_info_t pinfo;
|
||||||
|
+ unsigned int strSize;
|
||||||
|
|
||||||
|
/* allocate the native event structure */
|
||||||
|
event_table->num_native_events=0;
|
||||||
|
@@ -1247,6 +1248,13 @@ _pe_libpfm4_init(papi_vector_t *component, int cidx,
|
||||||
|
&pinfo,sizeof(pfm_pmu_info_t));
|
||||||
|
found_default++;
|
||||||
|
}
|
||||||
|
+ if ( (pinfo.type==PFM_PMU_TYPE_CORE) &&
|
||||||
|
+ ( _papi_hwi_system_info.hw_info.vendor == PAPI_VENDOR_ARM)) {
|
||||||
|
+ if (strlen(_papi_hwi_system_info.hw_info.model_string) == 0) {
|
||||||
|
+ strSize = sizeof(_papi_hwi_system_info.hw_info.model_string);
|
||||||
|
+ strncpy( _papi_hwi_system_info.hw_info.model_string, pinfo.desc, strSize - 1);
|
||||||
|
+ }
|
||||||
|
+ }
|
||||||
|
}
|
||||||
|
|
||||||
|
if (pmu_type==PMU_TYPE_UNCORE) {
|
||||||
|
commit 85003c716d76eff47607fa0967537c6cf63d8348
|
||||||
|
Author: Steve Walk <swalk.cavium@gmail.com>
|
||||||
|
Date: Fri Jun 8 15:50:50 2018 -0400
|
||||||
|
|
||||||
|
enable Cavium ThunderX2 support
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index bb11f61d3..46827f180 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1841,6 +1841,31 @@ PRESET,PAPI_L2_DCR,NOT_DERIVED,L2D_READ_ACCESS
|
||||||
|
PRESET,PAPI_L2_DCW,NOT_DERIVED,L2D_WRITE_ACCESS
|
||||||
|
PRESET,PAPI_L2_LDM,NOT_DERIVED,L2D_READ_REFILL
|
||||||
|
PRESET,PAPI_L2_STM,NOT_DERIVED,L2D_WRITE_REFILL
|
||||||
|
+
|
||||||
|
+#####################
|
||||||
|
+# ARM ThunderX2 #
|
||||||
|
+#####################
|
||||||
|
+CPU,arm_thunderx2
|
||||||
|
+#
|
||||||
|
+PRESET,PAPI_TOT_INS,NOT_DERIVED,INST_RETIRED
|
||||||
|
+PRESET,PAPI_TOT_CYC,NOT_DERIVED,CPU_CYCLES
|
||||||
|
+PRESET,PAPI_FP_INS,NOT_DERIVED,VFP_SPEC
|
||||||
|
+PRESET,PAPI_VEC_INS,NOT_DERIVED,ASE_SPEC
|
||||||
|
+PRESET,PAPI_BR_INS,NOT_DERIVED,BR_RETIRED
|
||||||
|
+PRESET,PAPI_LD_INS,NOT_DERIVED,LD_RETIRED
|
||||||
|
+PRESET,PAPI_SR_INS,NOT_DERIVED,ST_RETIRED
|
||||||
|
+PRESET,PAPI_L1_DCA,DERIVED_ADD,L1D_CACHE_RD,L1D_CACHE_WR
|
||||||
|
+PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L1_DCR,NOT_DERIVED,L1D_CACHE_RD
|
||||||
|
+PRESET,PAPI_L1_DCW,NOT_DERIVED,L1D_CACHE_WR
|
||||||
|
+PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
+PRESET,PAPI_L1_ICM,NOT_DERIVED,L1I_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L2_DCH,NOT_DERIVED,L2D_CACHE
|
||||||
|
+PRESET,PAPI_L2_DCM,NOT_DERIVED,L2D_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L2_DCR,NOT_DERIVED,L2D_CACHE_RD
|
||||||
|
+PRESET,PAPI_L2_DCW,NOT_DERIVED,L2D_CACHE_WR
|
||||||
|
+PRESET,PAPI_L2_LDM,NOT_DERIVED,L2D_CACHE_REFILL_RD
|
||||||
|
+
|
||||||
|
#
|
||||||
|
CPU,mips_74k
|
||||||
|
#
|
||||||
|
commit 9a44d82928ed17ba2ff21eb88b89c5829d0ea30e
|
||||||
|
Author: Steve Kaufmann <steven.kaufmann@hpe.com>
|
||||||
|
Date: Wed Jun 24 14:08:08 2020 -0400
|
||||||
|
|
||||||
|
Added PAPI preset support for Fujitsu A64FX.
|
||||||
|
|
||||||
|
Signed-off-by: Heike Jagode <jagode@icl.utk.edu>
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index 8e96adfbd..1b5c15542 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1877,6 +1877,21 @@ PRESET,PAPI_L2_DCR,NOT_DERIVED,L2D_CACHE_RD
|
||||||
|
PRESET,PAPI_L2_DCW,NOT_DERIVED,L2D_CACHE_WR
|
||||||
|
PRESET,PAPI_L2_LDM,NOT_DERIVED,L2D_CACHE_REFILL_RD
|
||||||
|
|
||||||
|
+#########################
|
||||||
|
+# ARM Fujitsu A64FX #
|
||||||
|
+#########################
|
||||||
|
+CPU,arm_a64fx
|
||||||
|
+#
|
||||||
|
+PRESET,PAPI_TOT_INS,NOT_DERIVED,INST_RETIRED
|
||||||
|
+PRESET,PAPI_TOT_CYC,NOT_DERIVED,CPU_CYCLES
|
||||||
|
+PRESET,PAPI_FP_INS,NOT_DERIVED,VFP_SPEC
|
||||||
|
+PRESET,PAPI_VEC_INS,NOT_DERIVED,ASE_SPEC
|
||||||
|
+PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
+PRESET,PAPI_L1_ICM,NOT_DERIVED,L1I_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L2_DCH,NOT_DERIVED,L2D_CACHE
|
||||||
|
+PRESET,PAPI_L2_DCM,NOT_DERIVED,L2D_CACHE_REFILL
|
||||||
|
+
|
||||||
|
#
|
||||||
|
CPU,mips_74k
|
||||||
|
#
|
||||||
|
commit b87ac4beda096086e0040f8ec1b44c4791a9739c
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Mon Dec 14 14:06:22 2020 +0900
|
||||||
|
|
||||||
|
Corrected typo for A64FX support (PAPI_L2_DCH is a typo of PAPI_L2_DCA)
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index fd75f9371..164f05641 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1937,7 +1937,7 @@ PRESET,PAPI_VEC_INS,NOT_DERIVED,ASE_SPEC
|
||||||
|
PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
PRESET,PAPI_L1_ICM,NOT_DERIVED,L1I_CACHE_REFILL
|
||||||
|
-PRESET,PAPI_L2_DCH,NOT_DERIVED,L2D_CACHE
|
||||||
|
+PRESET,PAPI_L2_DCA,NOT_DERIVED,L2D_CACHE
|
||||||
|
PRESET,PAPI_L2_DCM,NOT_DERIVED,L2D_CACHE_REFILL
|
||||||
|
|
||||||
|
#
|
||||||
|
commit 869864f813f0681b5c9a4b65de2135c8708a2afb
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Mon Dec 14 19:34:59 2020 +0900
|
||||||
|
|
||||||
|
Add or modify various A64FX support events, including floating point events (PAPI_FP_OPS, PAPI_SP_OPS, PAPI_DP_OPS).
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index 164f05641..9192b1041 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1930,15 +1930,46 @@ PRESET,PAPI_L2_LDM,NOT_DERIVED,L2D_CACHE_REFILL_RD
|
||||||
|
#########################
|
||||||
|
CPU,arm_a64fx
|
||||||
|
#
|
||||||
|
+PRESET,PAPI_PRF_DM,DERIVED_SUB,L2D_CACHE_REFILL_PRF,L2D_CACHE_MIBMCH_PRF
|
||||||
|
+PRESET,PAPI_MEM_SCY,NOT_DERIVED,LD_COMP_WAIT_L2_MISS
|
||||||
|
+PRESET,PAPI_STL_ICY,DERIVED_ADD,STALL_FRONTEND,STALL_BACKEND
|
||||||
|
+PRESET,PAPI_STL_CCY,NOT_DERIVED,0INST_COMMIT
|
||||||
|
+PRESET,PAPI_FUL_CCY,DERIVED_SUB,CPU_CYCLES,0INST_COMMIT,1INST_COMMIT,2INST_COMMIT,3INST_COMMIT,4INST_COMMIT
|
||||||
|
+PRESET,PAPI_HW_INT,DERIVED_ADD,EXC_IRQ,EXC_FIQ
|
||||||
|
+PRESET,PAPI_BR_MSP,NOT_DERIVED,BR_MIS_PRED
|
||||||
|
+PRESET,PAPI_BR_PRC,DERIVED_SUB,BR_PRED,BR_MIS_PRED
|
||||||
|
+PRESET,PAPI_FMA_INS,NOT_DERIVED,FP_FMA_SPEC
|
||||||
|
PRESET,PAPI_TOT_INS,NOT_DERIVED,INST_RETIRED
|
||||||
|
PRESET,PAPI_TOT_CYC,NOT_DERIVED,CPU_CYCLES
|
||||||
|
PRESET,PAPI_FP_INS,NOT_DERIVED,VFP_SPEC
|
||||||
|
+PRESET,PAPI_LD_INS,NOT_DERIVED,LD_SPEC
|
||||||
|
+PRESET,PAPI_SR_INS,NOT_DERIVED,ST_SPEC
|
||||||
|
+PRESET,PAPI_BR_INS,NOT_DERIVED,BR_PRED
|
||||||
|
PRESET,PAPI_VEC_INS,NOT_DERIVED,ASE_SPEC
|
||||||
|
+PRESET,PAPI_RES_STL,NOT_DERIVED,STALL_BACKEND
|
||||||
|
+PRESET,PAPI_LST_INS,NOT_DERIVED,LDST_SPEC
|
||||||
|
+PRESET,PAPI_SYC_INS,DERIVED_ADD,ISB_SPEC,DSB_SPEC,DMB_SPEC
|
||||||
|
+PRESET,PAPI_L1_DCA,NOT_DERIVED,L1D_CACHE
|
||||||
|
+PRESET,PAPI_L1_DCH,DERIVED_SUB,L1D_CACHE,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
+PRESET,PAPI_L1_ICH,DERIVED_SUB,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICM,NOT_DERIVED,L1I_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L1_TCA,DERIVED_ADD,L1D_CACHE,L1I_CACHE
|
||||||
|
+PRESET,PAPI_L1_TCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|-|,L1D_CACHE,L1D_CACHE_REFILL,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L1_TCM,DERIVED_ADD,L1D_CACHE_REFILL,L1I_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L2_DCA,NOT_DERIVED,L2D_CACHE
|
||||||
|
-PRESET,PAPI_L2_DCM,NOT_DERIVED,L2D_CACHE_REFILL
|
||||||
|
+PRESET,PAPI_L2_DCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|+|,L2D_CACHE,L2D_CACHE_REFILL,L2D_SWAP_DM,L2D_CACHE_MIBMCH_PRF
|
||||||
|
+PRESET,PAPI_L2_DCM,DERIVED_SUB,L2D_CACHE_REFILL,L2D_SWAP_DM,L2D_CACHE_MIBMCH_PRF
|
||||||
|
+PRESET,PAPI_L2_TCA,NOT_DERIVED,L2D_CACHE
|
||||||
|
+PRESET,PAPI_L2_TCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|+|,L2D_CACHE,L2D_CACHE_REFILL,L2D_SWAP_DM,L2D_CACHE_MIBMCH_PRF
|
||||||
|
+PRESET,PAPI_L2_TCM,DERIVED_SUB,L2D_CACHE_REFILL,L2D_SWAP_DM,L2D_CACHE_MIBMCH_PRF
|
||||||
|
+PRESET,PAPI_TLB_DM,NOT_DERIVED,L2D_TLB_REFILL
|
||||||
|
+PRESET,PAPI_TLB_IM,NOT_DERIVED,L2I_TLB_REFILL
|
||||||
|
+PRESET,PAPI_TLB_TL,DERIVED_ADD,L2D_TLB_REFILL,L2I_TLB_REFILL
|
||||||
|
+PRESET,PAPI_FP_OPS,DERIVED_POSTFIX,N0|512|128|/|*|N1|+|,FP_SCALE_OPS_SPEC,FP_FIXED_OPS_SPEC
|
||||||
|
+PRESET,PAPI_SP_OPS,DERIVED_POSTFIX,N0|512|128|/|*|N1|+|,FP_SP_SCALE_OPS_SPEC,FP_SP_FIXED_OPS_SPEC
|
||||||
|
+PRESET,PAPI_DP_OPS,DERIVED_POSTFIX,N0|512|128|/|*|N1|+|,FP_DP_SCALE_OPS_SPEC,FP_DP_FIXED_OPS_SPEC
|
||||||
|
|
||||||
|
#
|
||||||
|
CPU,mips_74k
|
||||||
|
commit 7a3c22763ef2ba00a2b8cb069c3501f35ecb13de
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Tue Dec 15 13:43:43 2020 +0900
|
||||||
|
|
||||||
|
modify PAPI_FP_INS and PAPI_VEC_INS for A64FX supports
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index 9192b1041..7b4ceb674 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1941,11 +1941,11 @@ PRESET,PAPI_BR_PRC,DERIVED_SUB,BR_PRED,BR_MIS_PRED
|
||||||
|
PRESET,PAPI_FMA_INS,NOT_DERIVED,FP_FMA_SPEC
|
||||||
|
PRESET,PAPI_TOT_INS,NOT_DERIVED,INST_RETIRED
|
||||||
|
PRESET,PAPI_TOT_CYC,NOT_DERIVED,CPU_CYCLES
|
||||||
|
-PRESET,PAPI_FP_INS,NOT_DERIVED,VFP_SPEC
|
||||||
|
+PRESET,PAPI_FP_INS,NOT_DERIVED,FP_SPEC
|
||||||
|
PRESET,PAPI_LD_INS,NOT_DERIVED,LD_SPEC
|
||||||
|
PRESET,PAPI_SR_INS,NOT_DERIVED,ST_SPEC
|
||||||
|
PRESET,PAPI_BR_INS,NOT_DERIVED,BR_PRED
|
||||||
|
-PRESET,PAPI_VEC_INS,NOT_DERIVED,ASE_SPEC
|
||||||
|
+PRESET,PAPI_VEC_INS,NOT_DERIVED,SIMD_INST_RETIRED
|
||||||
|
PRESET,PAPI_RES_STL,NOT_DERIVED,STALL_BACKEND
|
||||||
|
PRESET,PAPI_LST_INS,NOT_DERIVED,LDST_SPEC
|
||||||
|
PRESET,PAPI_SYC_INS,DERIVED_ADD,ISB_SPEC,DSB_SPEC,DMB_SPEC
|
||||||
|
commit 530d4763fb8e6dd52109387bd58c8c1305fd6b63
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Fri Feb 12 15:01:21 2021 +0900
|
||||||
|
|
||||||
|
remove PAPI_L1_DCA and PAPI_L1_DCH for a64fx
|
||||||
|
|
||||||
|
There seems to be a problem with PAPI_L1_DCA and PAPI_L1_DCH for a64fx that prefetch overcounts.
|
||||||
|
I delete (comment out) PAPI_L1_DCA and PAPI_L1_DCH for a64fx from the papi_events.csv file.
|
||||||
|
I will issue the pullrequest again once I have identified how to handle the overcount.
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index 7b4ceb674..0f5ec8344 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1949,8 +1949,8 @@ PRESET,PAPI_VEC_INS,NOT_DERIVED,SIMD_INST_RETIRED
|
||||||
|
PRESET,PAPI_RES_STL,NOT_DERIVED,STALL_BACKEND
|
||||||
|
PRESET,PAPI_LST_INS,NOT_DERIVED,LDST_SPEC
|
||||||
|
PRESET,PAPI_SYC_INS,DERIVED_ADD,ISB_SPEC,DSB_SPEC,DMB_SPEC
|
||||||
|
-PRESET,PAPI_L1_DCA,NOT_DERIVED,L1D_CACHE
|
||||||
|
-PRESET,PAPI_L1_DCH,DERIVED_SUB,L1D_CACHE,L1D_CACHE_REFILL
|
||||||
|
+#PRESET,PAPI_L1_DCA,NOT_DERIVED,L1D_CACHE
|
||||||
|
+#PRESET,PAPI_L1_DCH,DERIVED_SUB,L1D_CACHE,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
PRESET,PAPI_L1_ICH,DERIVED_SUB,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
commit 340f68940234f2db181147fc249907b4f1293e62
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Tue Feb 16 17:16:24 2021 +0900
|
||||||
|
|
||||||
|
remove PAPI_L1_TCA and PAPI_L1_TCH for a64fx
|
||||||
|
|
||||||
|
PAPI_L1_TCA and PAPI_L1_TCH for a64fx measure L1D_CACHE just like PAPI_L1_DCA and PAPI_L1_DCH,
|
||||||
|
so I delete (comment out) PAPI_L1_TCA and PAPI_L1_TCH for a64fx from the papi_events.csv file.
|
||||||
|
|
||||||
|
diff --git a/src/papi_events.csv b/src/papi_events.csv
|
||||||
|
index 0f5ec8344..4ef647959 100644
|
||||||
|
--- a/src/papi_events.csv
|
||||||
|
+++ b/src/papi_events.csv
|
||||||
|
@@ -1955,8 +1955,8 @@ PRESET,PAPI_L1_DCM,NOT_DERIVED,L1D_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICA,NOT_DERIVED,L1I_CACHE
|
||||||
|
PRESET,PAPI_L1_ICH,DERIVED_SUB,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_ICM,NOT_DERIVED,L1I_CACHE_REFILL
|
||||||
|
-PRESET,PAPI_L1_TCA,DERIVED_ADD,L1D_CACHE,L1I_CACHE
|
||||||
|
-PRESET,PAPI_L1_TCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|-|,L1D_CACHE,L1D_CACHE_REFILL,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
+#PRESET,PAPI_L1_TCA,DERIVED_ADD,L1D_CACHE,L1I_CACHE
|
||||||
|
+#PRESET,PAPI_L1_TCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|-|,L1D_CACHE,L1D_CACHE_REFILL,L1I_CACHE,L1I_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L1_TCM,DERIVED_ADD,L1D_CACHE_REFILL,L1I_CACHE_REFILL
|
||||||
|
PRESET,PAPI_L2_DCA,NOT_DERIVED,L2D_CACHE
|
||||||
|
PRESET,PAPI_L2_DCH,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|+|,L2D_CACHE,L2D_CACHE_REFILL,L2D_SWAP_DM,L2D_CACHE_MIBMCH_PRF
|
144
SOURCES/papi-mx.patch
Normal file
144
SOURCES/papi-mx.patch
Normal file
@ -0,0 +1,144 @@
|
|||||||
|
commit 3a6c9a855195e6f6f44ad6dffe2cd4046426ab53
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Wed Nov 25 21:46:26 2020 +0900
|
||||||
|
|
||||||
|
fix for performance improvement of _mx_init_component() function
|
||||||
|
|
||||||
|
diff --git a/src/components/mx/linux-mx.c b/src/components/mx/linux-mx.c
|
||||||
|
index 2da406d14..34e6f02c2 100644
|
||||||
|
--- a/src/components/mx/linux-mx.c
|
||||||
|
+++ b/src/components/mx/linux-mx.c
|
||||||
|
@@ -224,26 +224,35 @@ _mx_init_component( int cidx )
|
||||||
|
{
|
||||||
|
|
||||||
|
FILE *fff;
|
||||||
|
- char test_string[BUFSIZ];
|
||||||
|
+ char *path;
|
||||||
|
+ int len, pathlen;
|
||||||
|
|
||||||
|
/* detect if MX available */
|
||||||
|
|
||||||
|
- strncpy(mx_counters_exe,"mx_counters 2> /dev/null",BUFSIZ);
|
||||||
|
- fff=popen(mx_counters_exe,"r");
|
||||||
|
- /* popen only returns NULL if "sh" fails, not the actual command */
|
||||||
|
- if (fgets(test_string,BUFSIZ,fff)==NULL) {
|
||||||
|
- pclose(fff);
|
||||||
|
- strncpy(mx_counters_exe,"./components/mx/utils/fake_mx_counters 2> /dev/null",BUFSIZ);
|
||||||
|
- fff=popen(mx_counters_exe,"r");
|
||||||
|
- if (fgets(test_string,BUFSIZ,fff)==NULL) {
|
||||||
|
- pclose(fff);
|
||||||
|
- /* neither real nor fake found */
|
||||||
|
- strncpy(_mx_vector.cmp_info.disabled_reason,
|
||||||
|
- "No MX utilities found",PAPI_MAX_STR_LEN);
|
||||||
|
- return PAPI_ECMP;
|
||||||
|
+ path = getenv("PATH");
|
||||||
|
+ pathlen = strlen(path);
|
||||||
|
+ while(pathlen > 0) {
|
||||||
|
+ len = strcspn(path, ":");
|
||||||
|
+ strncpy(mx_counters_exe, path, len);
|
||||||
|
+ mx_counters_exe[len] = '\0';
|
||||||
|
+ strcat(mx_counters_exe, "/mx_counters");
|
||||||
|
+ fff = fopen(mx_counters_exe, "r");
|
||||||
|
+ if (fff != NULL) {
|
||||||
|
+ strcat(mx_counters_exe, " 2> /dev/null");
|
||||||
|
+ break;
|
||||||
|
}
|
||||||
|
+ pathlen = pathlen - len - 1;
|
||||||
|
+ if (pathlen > 0) {
|
||||||
|
+ path = path + len + 1;
|
||||||
|
+ }
|
||||||
|
+ }
|
||||||
|
+ if (fff == NULL) {
|
||||||
|
+ /* neither real nor fake found */
|
||||||
|
+ strncpy(_mx_vector.cmp_info.disabled_reason,
|
||||||
|
+ "No MX utilities found",PAPI_MAX_STR_LEN);
|
||||||
|
+ return PAPI_ECMP;
|
||||||
|
}
|
||||||
|
- pclose(fff);
|
||||||
|
+ fclose(fff);
|
||||||
|
|
||||||
|
num_events=MX_MAX_COUNTERS;
|
||||||
|
_mx_vector.cmp_info.num_native_events=num_events;
|
||||||
|
commit 3a2560a86be44f4b15d96a45eda8e7f387b9166c
|
||||||
|
Author: Masahiko, Yamada <yamada.masahiko@fujitsu.com>
|
||||||
|
Date: Tue Jan 26 16:30:40 2021 +0900
|
||||||
|
|
||||||
|
Add string length check before strncpy() and strcat() calls in _mx_init_component()
|
||||||
|
|
||||||
|
Myrinet Express-related component MX modules are initialized with the _mx_init_component() function,
|
||||||
|
which is called from the PAPI_library_init() function.
|
||||||
|
The popen(3) call runs a loadable module called "mx_counters",
|
||||||
|
and if the loadable module does not exist,
|
||||||
|
it attempts to run a loadable module called "./components/mx/utils/fake_mx_counters".
|
||||||
|
In an environment where there are no "mx_counters" and "./components/mx/utils/fake_mx_counters" loadable modules,
|
||||||
|
popen(3) will be called twice uselessly.
|
||||||
|
popen(3) internally calls pipe(2) once, fork(2) twice and exec(2) once.
|
||||||
|
|
||||||
|
The size of the user space of the application calling the PAPI_library_init() function affects the performance of fork(2),
|
||||||
|
which is called as an extension of popen(3).
|
||||||
|
As a result, the performance of the PAPI_library_init() function is affected by the amount of user space in the application
|
||||||
|
that called the PAPI_library_init() function.
|
||||||
|
|
||||||
|
In the _mx_init_component() function,
|
||||||
|
the MX module only needs to be able to verify that a load module named "mx_counters" exists.
|
||||||
|
We improved the _mx_init_component() function to call fopen(3) instead of popen(3).
|
||||||
|
We add string length check before strncpy() and strcat() calls in _mx_init_component() function.
|
||||||
|
|
||||||
|
diff --git a/src/components/mx/linux-mx.c b/src/components/mx/linux-mx.c
|
||||||
|
index 34e6f02c2..c2920d65b 100644
|
||||||
|
--- a/src/components/mx/linux-mx.c
|
||||||
|
+++ b/src/components/mx/linux-mx.c
|
||||||
|
@@ -225,7 +225,7 @@ _mx_init_component( int cidx )
|
||||||
|
|
||||||
|
FILE *fff;
|
||||||
|
char *path;
|
||||||
|
- int len, pathlen;
|
||||||
|
+ int checklen, len, pathlen;
|
||||||
|
|
||||||
|
/* detect if MX available */
|
||||||
|
|
||||||
|
@@ -233,13 +233,31 @@ _mx_init_component( int cidx )
|
||||||
|
pathlen = strlen(path);
|
||||||
|
while(pathlen > 0) {
|
||||||
|
len = strcspn(path, ":");
|
||||||
|
- strncpy(mx_counters_exe, path, len);
|
||||||
|
+ if (len < BUFSIZ) {
|
||||||
|
+ strncpy(mx_counters_exe, path, len);
|
||||||
|
+ } else {
|
||||||
|
+ fff = NULL;
|
||||||
|
+ break;
|
||||||
|
+ }
|
||||||
|
mx_counters_exe[len] = '\0';
|
||||||
|
- strcat(mx_counters_exe, "/mx_counters");
|
||||||
|
+ checklen = len + strlen("/mx_counters");
|
||||||
|
+ if (checklen < BUFSIZ) {
|
||||||
|
+ strcat(mx_counters_exe, "/mx_counters");
|
||||||
|
+ } else {
|
||||||
|
+ fff = NULL;
|
||||||
|
+ break;
|
||||||
|
+ }
|
||||||
|
fff = fopen(mx_counters_exe, "r");
|
||||||
|
if (fff != NULL) {
|
||||||
|
- strcat(mx_counters_exe, " 2> /dev/null");
|
||||||
|
- break;
|
||||||
|
+ checklen = checklen + strlen(" 2> /dev/null");
|
||||||
|
+ if (checklen < BUFSIZ) {
|
||||||
|
+ strcat(mx_counters_exe, " 2> /dev/null");
|
||||||
|
+ break;
|
||||||
|
+ } else {
|
||||||
|
+ fclose(fff);
|
||||||
|
+ fff = NULL;
|
||||||
|
+ break;
|
||||||
|
+ }
|
||||||
|
}
|
||||||
|
pathlen = pathlen - len - 1;
|
||||||
|
if (pathlen > 0) {
|
||||||
|
@@ -247,7 +265,7 @@ _mx_init_component( int cidx )
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if (fff == NULL) {
|
||||||
|
- /* neither real nor fake found */
|
||||||
|
+ /* mx_counters not found */
|
||||||
|
strncpy(_mx_vector.cmp_info.disabled_reason,
|
||||||
|
"No MX utilities found",PAPI_MAX_STR_LEN);
|
||||||
|
return PAPI_ECMP;
|
22
SOURCES/papi-rhbz1918721.patch
Normal file
22
SOURCES/papi-rhbz1918721.patch
Normal file
@ -0,0 +1,22 @@
|
|||||||
|
diff -up papi-5.6.0/src/papi_events.csv.p9 papi-5.6.0/src/papi_events.csv
|
||||||
|
--- papi-5.6.0/src/papi_events.csv.p9 2021-05-25 16:19:17.342588151 -0400
|
||||||
|
+++ papi-5.6.0/src/papi_events.csv 2021-05-25 16:54:06.357460525 -0400
|
||||||
|
@@ -1580,15 +1580,15 @@ PRESET,PAPI_L1_DCR,DERIVED_SUB,PM_LD_REF
|
||||||
|
#PRESET,PAPI_L1_DCA,DERIVED_POSTFIX,N0|N1|-|N2|+|N3|-,PM_ST_FIN,PM_ST_MISS_L1,PM_LD_REF_L1,PM_LD_MISS_L1_ALT
|
||||||
|
PRESET,PAPI_L1_DCA,DERIVED_ADD,PM_LD_REF_L1,PM_ST_CMPL
|
||||||
|
PRESET,PAPI_L2_DCM,NOT_DERIVED,PM_DATA_FROM_L2MISS
|
||||||
|
-PRESET,PAPI_L2_LDM,NOT_DERIVED,PM_L2_LD_MISS
|
||||||
|
-PRESET,PAPI_L2_STM,NOT_DERIVED,PM_L2_ST_MISS
|
||||||
|
+#PRESET,PAPI_L2_LDM,NOT_DERIVED,PM_L2_LD_MISS
|
||||||
|
+#PRESET,PAPI_L2_STM,NOT_DERIVED,PM_L2_ST_MISS
|
||||||
|
PRESET,PAPI_L3_DCR,NOT_DERIVED,PM_DATA_FROM_L2MISS
|
||||||
|
PRESET,PAPI_L3_DCM,DERIVED_ADD,PM_DATA_FROM_LMEM,PM_DATA_FROM_RMEM
|
||||||
|
PRESET,PAPI_L3_LDM,DERIVED_ADD,PM_DATA_FROM_LMEM,PM_DATA_FROM_RMEM
|
||||||
|
PRESET,PAPI_L1_ICH,NOT_DERIVED,PM_INST_FROM_L1
|
||||||
|
PRESET,PAPI_L1_ICM,NOT_DERIVED,PM_L1_ICACHE_MISS
|
||||||
|
PRESET,PAPI_L2_ICM,NOT_DERIVED,PM_INST_FROM_L2MISS
|
||||||
|
-PRESET,PAPI_L2_ICM,NOT_DERIVED,PM_L2_INST_MISS
|
||||||
|
+#PRESET,PAPI_L2_ICM,NOT_DERIVED,PM_L2_INST_MISS
|
||||||
|
PRESET,PAPI_L2_ICH,NOT_DERIVED,PM_INST_FROM_L2
|
||||||
|
PRESET,PAPI_L3_ICA,NOT_DERIVED,PM_INST_FROM_L2MISS
|
||||||
|
PRESET,PAPI_L3_ICH,NOT_DERIVED,PM_INST_FROM_L3
|
@ -8,7 +8,7 @@
|
|||||||
Summary: Performance Application Programming Interface
|
Summary: Performance Application Programming Interface
|
||||||
Name: papi
|
Name: papi
|
||||||
Version: 5.6.0
|
Version: 5.6.0
|
||||||
Release: 11%{?dist}
|
Release: 14%{?dist}
|
||||||
License: BSD
|
License: BSD
|
||||||
Group: Development/System
|
Group: Development/System
|
||||||
Requires: papi-libs = %{version}-%{release}
|
Requires: papi-libs = %{version}-%{release}
|
||||||
@ -18,6 +18,9 @@ Patch1: papi-ldflags.patch
|
|||||||
Patch2: papi-divzero.patch
|
Patch2: papi-divzero.patch
|
||||||
Patch3: papi-rhbz1807346.patch
|
Patch3: papi-rhbz1807346.patch
|
||||||
Patch4: papi-thread_init.patch
|
Patch4: papi-thread_init.patch
|
||||||
|
Patch5: papi-mx.patch
|
||||||
|
Patch6: papi-bz1908126.patch
|
||||||
|
Patch7: papi-rhbz1918721.patch
|
||||||
BuildRequires: autoconf
|
BuildRequires: autoconf
|
||||||
BuildRequires: doxygen
|
BuildRequires: doxygen
|
||||||
BuildRequires: ncurses-devel
|
BuildRequires: ncurses-devel
|
||||||
@ -85,6 +88,9 @@ the PAPI user-space libraries and interfaces.
|
|||||||
%patch2 -p1 -b .divzero
|
%patch2 -p1 -b .divzero
|
||||||
%patch3 -p1 -b .rhbz1807346
|
%patch3 -p1 -b .rhbz1807346
|
||||||
%patch4 -p1 -b .thread_init
|
%patch4 -p1 -b .thread_init
|
||||||
|
%patch5 -p1
|
||||||
|
%patch6 -p1
|
||||||
|
%patch7 -p1
|
||||||
|
|
||||||
%build
|
%build
|
||||||
%if %{without bundled_libpfm}
|
%if %{without bundled_libpfm}
|
||||||
@ -167,6 +173,15 @@ chrpath --delete $RPM_BUILD_ROOT%{_libdir}/*.so*
|
|||||||
%{_libdir}/*.a
|
%{_libdir}/*.a
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
* Tue May 25 2021 William Cohen <wcohen@redhat.com> - 5.6.0-14
|
||||||
|
- Disable problematic IBM Power9 events.
|
||||||
|
|
||||||
|
* Tue May 25 2021 William Cohen <wcohen@redhat.com> - 5.6.0-13
|
||||||
|
- Add Fujitsu A64FX support.
|
||||||
|
|
||||||
|
* Tue May 18 2021 William Cohen <wcohen@redhat.com> - 5.6.0-12
|
||||||
|
- Improvements to mx component.
|
||||||
|
|
||||||
* Fri Aug 21 2020 William Cohen <wcohen@redhat.com> - 5.6.0-11
|
* Fri Aug 21 2020 William Cohen <wcohen@redhat.com> - 5.6.0-11
|
||||||
- Correct the handling of multiple threads. (rhbz1807346)
|
- Correct the handling of multiple threads. (rhbz1807346)
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user