Update to 20.1.2
Resolves: RHEL-80988
This commit is contained in:
		
							parent
							
								
									2421001db4
								
							
						
					
					
						commit
						442ba971bf
					
				| @ -4,13 +4,14 @@ | ||||
| 
 | ||||
| COPR_USERNAME=$(shell rpm --eval %copr_username) | ||||
| COPR_PROJECT=$(shell rpm --eval %copr_projectname) | ||||
| YYYYMMDD=$(shell date +%Y%m%d) | ||||
| 
 | ||||
| .PHONY: srpm | ||||
| srpm: | ||||
| 	dnf install -y dnf-plugins-core fedora-packager | ||||
| 	dnf copr enable -y --setopt=reposdir=/tmp/yum.repos.d $(COPR_USERNAME)/$(COPR_PROJECT) | ||||
| 	dnf install -y --setopt=reposdir=/tmp/yum.repos.d llvm-snapshot-builder | ||||
| 	dnf install -y git tar xz curl --setopt=install_weak_deps=False | ||||
| 	YYYYMMDD=$(YYYYMMDD) ./.copr/snapshot-info.sh > version.spec.inc | ||||
| 	rpmbuild \
 | ||||
| 		--with=snapshot_build \
 | ||||
| 		--define "_srcrpmdir $(outdir)" \
 | ||||
| 		--define "_sourcedir $(shell pwd)" \
 | ||||
| 		--define "_disable_source_fetch 0" \
 | ||||
|  | ||||
							
								
								
									
										76
									
								
								.copr/snapshot-info.sh
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										76
									
								
								.copr/snapshot-info.sh
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,76 @@ | ||||
| #!/usr/bin/bash | ||||
| 
 | ||||
| # You need these packages to run this script: git tar xz curl-minimal | ||||
| 
 | ||||
| set -e | ||||
| 
 | ||||
| # This is important for systems that have a different local but want to produce | ||||
| # a valid changelog date. | ||||
| LANG=en_EN | ||||
| 
 | ||||
| function loginfo() { | ||||
|     local msg=$1 | ||||
|     >&2 echo "[INFO]" $msg | ||||
| } | ||||
| 
 | ||||
| function logerr() { | ||||
|     local msg=$1 | ||||
|     >&2 echo "[ERROR]" $msg | ||||
| } | ||||
| 
 | ||||
| # Check if we shall gather versioning information from a supplied git tree | ||||
| if [ "$GIT_TREE" != "" ]; then | ||||
|     loginfo "Gathering snapshot info from here: $GIT_TREE" | ||||
|     if [ "$(git -C $GIT_TREE  rev-parse --is-inside-work-tree 2>/dev/null)" != "true" ]; then | ||||
|         logerr "Not a git directory: $GIT_TREE" | ||||
|         exit 1 | ||||
|     fi | ||||
|     llvm_snapshot_git_revision=$(git -C $GIT_TREE rev-parse HEAD) | ||||
|     versionfile=$GIT_TREE/cmake/Modules/LLVMVersion.cmake | ||||
|     llvm_snapshot_version=`grep -ioP 'set\(\s*LLVM_VERSION_(MAJOR|MINOR|PATCH)\s\K[0-9]+' ${versionfile} | paste -sd '.'` | ||||
| fi | ||||
| 
 | ||||
| loginfo "Determine date in YYYYMMDD form" | ||||
| llvm_snapshot_yyyymmdd=$(date +%Y%m%d) | ||||
| [[ ! -z "${YYYYMMDD}" ]] && llvm_snapshot_yyyymmdd=$YYYYMMDD | ||||
| 
 | ||||
| if [ -z $GIT_TREE ]; then | ||||
|     git_revision_url=https://github.com/fedora-llvm-team/llvm-snapshots/releases/download/snapshot-version-sync/llvm-git-revision-${llvm_snapshot_yyyymmdd}.txt | ||||
|     loginfo "Get the revision for today from $git_revision_url" | ||||
|     llvm_snapshot_git_revision=$(curl -sL $git_revision_url) | ||||
| fi | ||||
| llvm_snapshot_git_revision_short=$(echo "${llvm_snapshot_git_revision:0:14}") | ||||
| 
 | ||||
| 
 | ||||
| if [ -z $GIT_TREE ]; then | ||||
|     release_url=https://github.com/fedora-llvm-team/llvm-snapshots/releases/download/snapshot-version-sync/llvm-release-${llvm_snapshot_yyyymmdd}.txt | ||||
|     loginfo "Get the release for today from $release_url" | ||||
|     llvm_snapshot_version=$(curl -sL $release_url) | ||||
| fi | ||||
| llvm_snapshot_version_major=$(echo $llvm_snapshot_version | cut -f1 -d.) | ||||
| llvm_snapshot_version_minor=$(echo $llvm_snapshot_version | cut -f2 -d.) | ||||
| llvm_snapshot_version_patch=$(echo $llvm_snapshot_version | cut -f3 -d.) | ||||
| llvm_snapshot_version_suffix=pre${llvm_snapshot_yyyymmdd}.g${llvm_snapshot_git_revision_short} | ||||
| 
 | ||||
| tempfile=$(mktemp) | ||||
| cat > $tempfile <<EOF | ||||
| %global maj_ver ${llvm_snapshot_version_major} | ||||
| %global min_ver ${llvm_snapshot_version_minor} | ||||
| %global patch_ver ${llvm_snapshot_version_patch} | ||||
| %undefine rc_ver | ||||
| 
 | ||||
| %global llvm_snapshot_version            ${llvm_snapshot_version} | ||||
| %global llvm_snapshot_version_major      ${llvm_snapshot_version_major} | ||||
| %global llvm_snapshot_version_minor      ${llvm_snapshot_version_minor} | ||||
| %global llvm_snapshot_version_patch      ${llvm_snapshot_version_patch} | ||||
| %global llvm_snapshot_yyyymmdd           ${llvm_snapshot_yyyymmdd} | ||||
| %global llvm_snapshot_git_revision       ${llvm_snapshot_git_revision} | ||||
| %global llvm_snapshot_git_revision_short ${llvm_snapshot_git_revision_short} | ||||
| %global llvm_snapshot_version_suffix     ${llvm_snapshot_version_suffix} | ||||
| EOF | ||||
| 
 | ||||
| # One for logs | ||||
| cat $tempfile >&2 | ||||
| 
 | ||||
| # One to redirect it away | ||||
| cat $tempfile | ||||
							
								
								
									
										9
									
								
								.git-blame-ignore-revs
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										9
									
								
								.git-blame-ignore-revs
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,9 @@ | ||||
| # Since version 2.23 (released in August 2019), git-blame has a feature | ||||
| # to ignore or bypass certain commits. | ||||
| # | ||||
| # This file contains a list of commits that are not likely what you | ||||
| # are looking for in a blame, such as mass reformatting or renaming. | ||||
| # You can set this file as a default ignore file for blame by running | ||||
| # the following command. | ||||
| # | ||||
| # $ git config blame.ignoreRevsFile .git-blame-ignore-revs | ||||
							
								
								
									
										7
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										7
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							| @ -1,7 +1,14 @@ | ||||
| /*.src.rpm | ||||
| /*.src.tar.xz | ||||
| /*.src.tar.xz.sig | ||||
| /*.tar.gz | ||||
| /cmake/ | ||||
| /llvm-*.src/ | ||||
| /results_llvm/ | ||||
| /third-party/ | ||||
| /llvm-git-revision-*.txt | ||||
| /llvm-release-*.txt | ||||
| /BUILD | ||||
| /BUILDROOT | ||||
| /out | ||||
| /version.spec.inc | ||||
|  | ||||
							
								
								
									
										30
									
								
								.pre-commit-config.yaml
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										30
									
								
								.pre-commit-config.yaml
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,30 @@ | ||||
| # See https://pre-commit.com for more information | ||||
| # See https://pre-commit.com/hooks.html for more hooks | ||||
| repos: | ||||
|   - repo: https://github.com/pre-commit/pre-commit-hooks | ||||
|     rev: v5.0.0 | ||||
|     hooks: | ||||
|       - id: check-ast | ||||
|       - id: check-case-conflict | ||||
|       - id: check-docstring-first | ||||
|       - id: check-executables-have-shebangs | ||||
|       - id: check-merge-conflict | ||||
|       - id: check-symlinks | ||||
|       - id: trailing-whitespace | ||||
|       - id: end-of-file-fixer | ||||
|       - id: mixed-line-ending | ||||
|       - id: fix-byte-order-marker | ||||
|       - id: detect-private-key | ||||
|       - id: check-toml | ||||
|       - id: check-yaml | ||||
|         args: | ||||
|           - "--allow-multiple-documents" | ||||
|           - "--unsafe" | ||||
| 
 | ||||
|   # See https://tmt.readthedocs.io/en/latest/guide.html#checking-data-validity | ||||
|   - repo: https://github.com/teemtee/tmt.git | ||||
|     rev: 1.38.0 | ||||
|     hooks: | ||||
|       - id: tmt-lint | ||||
| 
 | ||||
| exclude: ".*\\.patch" | ||||
| @ -1,29 +0,0 @@ | ||||
| From b1c60d7fa322a2d208556087df9e7ef94bfbffb8 Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Wed, 8 May 2024 12:30:36 +0900 | ||||
| Subject: [PATCH] Always build shared libs for LLD | ||||
| 
 | ||||
| We don't want to enable BUILD_SHARED_LIBS for the whole build, | ||||
| but we do want to build lld libraries. | ||||
| ---
 | ||||
|  lld/cmake/modules/AddLLD.cmake | 5 ++--- | ||||
|  1 file changed, 2 insertions(+), 3 deletions(-) | ||||
| 
 | ||||
| diff --git a/lld/cmake/modules/AddLLD.cmake b/lld/cmake/modules/AddLLD.cmake
 | ||||
| index 2ee066b41535..270c03f096ac 100644
 | ||||
| --- a/lld/cmake/modules/AddLLD.cmake
 | ||||
| +++ b/lld/cmake/modules/AddLLD.cmake
 | ||||
| @@ -7,9 +7,8 @@ macro(add_lld_library name)
 | ||||
|      "" | ||||
|      "" | ||||
|      ${ARGN}) | ||||
| -  if(ARG_SHARED)
 | ||||
| -    set(ARG_ENABLE_SHARED SHARED)
 | ||||
| -  endif()
 | ||||
| +  # Always build shared libs for LLD.
 | ||||
| +  set(ARG_ENABLE_SHARED SHARED)
 | ||||
|    llvm_add_library(${name} ${ARG_ENABLE_SHARED} ${ARG_UNPARSED_ARGUMENTS}) | ||||
|    set_target_properties(${name} PROPERTIES FOLDER "lld libraries") | ||||
|   | ||||
| -- 
 | ||||
| 2.44.0 | ||||
							
								
								
									
										59
									
								
								0001-20-polly-shared-libs.patch
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										59
									
								
								0001-20-polly-shared-libs.patch
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,59 @@ | ||||
| From cecb98f56e7d6619d0427fbdbc2f200ce212f0c6 Mon Sep 17 00:00:00 2001 | ||||
| From: Konrad Kleine <kkleine@redhat.com> | ||||
| Date: Tue, 28 Jan 2025 08:34:09 +0000 | ||||
| Subject: [PATCH] [polly] shared libs | ||||
| 
 | ||||
| ---
 | ||||
|  polly/cmake/polly_macros.cmake    | 5 ++++- | ||||
|  polly/lib/CMakeLists.txt          | 1 + | ||||
|  polly/lib/External/CMakeLists.txt | 1 + | ||||
|  3 files changed, 6 insertions(+), 1 deletion(-) | ||||
| 
 | ||||
| diff --git a/polly/cmake/polly_macros.cmake b/polly/cmake/polly_macros.cmake
 | ||||
| index 9bd7b0b0ea59..fc2c3a76901f 100644
 | ||||
| --- a/polly/cmake/polly_macros.cmake
 | ||||
| +++ b/polly/cmake/polly_macros.cmake
 | ||||
| @@ -1,5 +1,5 @@
 | ||||
|  macro(add_polly_library name) | ||||
| -  cmake_parse_arguments(ARG "" "" "" ${ARGN})
 | ||||
| +  cmake_parse_arguments(ARG "SHARED" "" "" ${ARGN})
 | ||||
|    set(srcs ${ARG_UNPARSED_ARGUMENTS}) | ||||
|    if(MSVC_IDE OR XCODE) | ||||
|      file( GLOB_RECURSE headers *.h *.td *.def) | ||||
| @@ -17,6 +17,9 @@ macro(add_polly_library name)
 | ||||
|    else() | ||||
|      set(libkind) | ||||
|    endif() | ||||
| +  if (ARG_SHARED)
 | ||||
| +    set(libkind SHARED)
 | ||||
| +  endif()
 | ||||
|    add_library( ${name} ${libkind} ${srcs} ) | ||||
|    set_target_properties(${name} PROPERTIES FOLDER "Polly/Libraries") | ||||
|   | ||||
| diff --git a/polly/lib/CMakeLists.txt b/polly/lib/CMakeLists.txt
 | ||||
| index d91f4ecd37e6..965f635b7ff6 100644
 | ||||
| --- a/polly/lib/CMakeLists.txt
 | ||||
| +++ b/polly/lib/CMakeLists.txt
 | ||||
| @@ -41,6 +41,7 @@ set(POLLY_COMPONENTS
 | ||||
|  # the sources them to be recompiled for each of them. | ||||
|  add_llvm_pass_plugin(Polly | ||||
|    NO_MODULE | ||||
| +  SHARED
 | ||||
|    SUBPROJECT Polly | ||||
|    Analysis/DependenceInfo.cpp | ||||
|    Analysis/PolyhedralInfo.cpp | ||||
| diff --git a/polly/lib/External/CMakeLists.txt b/polly/lib/External/CMakeLists.txt
 | ||||
| index 5dd69b7199dc..f065fbd7b942 100644
 | ||||
| --- a/polly/lib/External/CMakeLists.txt
 | ||||
| +++ b/polly/lib/External/CMakeLists.txt
 | ||||
| @@ -284,6 +284,7 @@ if (POLLY_BUNDLED_ISL)
 | ||||
|      ) | ||||
|   | ||||
|    add_polly_library(PollyISL | ||||
| +    SHARED
 | ||||
|      ${ISL_FILES} | ||||
|      ) | ||||
|   | ||||
| -- 
 | ||||
| 2.46.0 | ||||
| 
 | ||||
							
								
								
									
										81
									
								
								0001-SystemZ-Fix-ICE-with-i128-i64-uaddo-carry-chain.patch
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										81
									
								
								0001-SystemZ-Fix-ICE-with-i128-i64-uaddo-carry-chain.patch
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,81 @@ | ||||
| From 6d5697f7cb4e933d2f176c46b7ac05a9cbaeb8b6 Mon Sep 17 00:00:00 2001 | ||||
| From: Ulrich Weigand <ulrich.weigand@de.ibm.com> | ||||
| Date: Thu, 23 Jan 2025 19:11:18 +0100 | ||||
| Subject: [PATCH] [SystemZ] Fix ICE with i128->i64 uaddo carry chain | ||||
| 
 | ||||
| We can only optimize a uaddo_carry via specialized instruction | ||||
| if the carry was produced by another uaddo(_carry) instruction; | ||||
| there is already a check for that. | ||||
| 
 | ||||
| However, i128 uaddo(_carry) use a completely different mechanism; | ||||
| they indicate carry in a vector register instead of the CC flag. | ||||
| Thus, we must also check that we don't mix those two - that check | ||||
| has been missing. | ||||
| 
 | ||||
| Fixes: https://github.com/llvm/llvm-project/issues/124001 | ||||
| ---
 | ||||
|  .../Target/SystemZ/SystemZISelLowering.cpp    | 12 ++++++---- | ||||
|  llvm/test/CodeGen/SystemZ/pr124001.ll         | 23 +++++++++++++++++++ | ||||
|  2 files changed, 31 insertions(+), 4 deletions(-) | ||||
|  create mode 100644 llvm/test/CodeGen/SystemZ/pr124001.ll | ||||
| 
 | ||||
| diff --git a/llvm/lib/Target/SystemZ/SystemZISelLowering.cpp b/llvm/lib/Target/SystemZ/SystemZISelLowering.cpp
 | ||||
| index 4040ab6d4510..1fb31c26e20d 100644
 | ||||
| --- a/llvm/lib/Target/SystemZ/SystemZISelLowering.cpp
 | ||||
| +++ b/llvm/lib/Target/SystemZ/SystemZISelLowering.cpp
 | ||||
| @@ -4708,15 +4708,19 @@ SDValue SystemZTargetLowering::lowerXALUO(SDValue Op,
 | ||||
|  } | ||||
|   | ||||
|  static bool isAddCarryChain(SDValue Carry) { | ||||
| -  while (Carry.getOpcode() == ISD::UADDO_CARRY)
 | ||||
| +  while (Carry.getOpcode() == ISD::UADDO_CARRY &&
 | ||||
| +         Carry->getValueType(0) != MVT::i128)
 | ||||
|      Carry = Carry.getOperand(2); | ||||
| -  return Carry.getOpcode() == ISD::UADDO;
 | ||||
| +  return Carry.getOpcode() == ISD::UADDO &&
 | ||||
| +         Carry->getValueType(0) != MVT::i128;
 | ||||
|  } | ||||
|   | ||||
|  static bool isSubBorrowChain(SDValue Carry) { | ||||
| -  while (Carry.getOpcode() == ISD::USUBO_CARRY)
 | ||||
| +  while (Carry.getOpcode() == ISD::USUBO_CARRY &&
 | ||||
| +         Carry->getValueType(0) != MVT::i128)
 | ||||
|      Carry = Carry.getOperand(2); | ||||
| -  return Carry.getOpcode() == ISD::USUBO;
 | ||||
| +  return Carry.getOpcode() == ISD::USUBO &&
 | ||||
| +         Carry->getValueType(0) != MVT::i128;
 | ||||
|  } | ||||
|   | ||||
|  // Lower UADDO_CARRY/USUBO_CARRY nodes. | ||||
| diff --git a/llvm/test/CodeGen/SystemZ/pr124001.ll b/llvm/test/CodeGen/SystemZ/pr124001.ll
 | ||||
| new file mode 100644 | ||||
| index 000000000000..9cf630a55dd6
 | ||||
| --- /dev/null
 | ||||
| +++ b/llvm/test/CodeGen/SystemZ/pr124001.ll
 | ||||
| @@ -0,0 +1,23 @@
 | ||||
| +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
 | ||||
| +; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s
 | ||||
| +
 | ||||
| +define i64 @test(i128 %in) {
 | ||||
| +; CHECK-LABEL: test:
 | ||||
| +; CHECK:       # %bb.0:
 | ||||
| +; CHECK-NEXT:    larl %r1, .LCPI0_0
 | ||||
| +; CHECK-NEXT:    vl %v0, 0(%r2), 3
 | ||||
| +; CHECK-NEXT:    vl %v1, 0(%r1), 3
 | ||||
| +; CHECK-NEXT:    vaccq %v0, %v0, %v1
 | ||||
| +; CHECK-NEXT:    vlgvg %r1, %v0, 1
 | ||||
| +; CHECK-NEXT:    la %r2, 1(%r1)
 | ||||
| +; CHECK-NEXT:    br %r14
 | ||||
| +  %1 = tail call { i128, i1 } @llvm.uadd.with.overflow.i128(i128 %in, i128 1)
 | ||||
| +  %2 = extractvalue { i128, i1 } %1, 1
 | ||||
| +  %3 = zext i1 %2 to i64
 | ||||
| +  %4 = add i64 %3, 1
 | ||||
| +  ret i64 %4
 | ||||
| +}
 | ||||
| +
 | ||||
| +declare { i128, i1 } @llvm.uadd.with.overflow.i128(i128, i128) #0
 | ||||
| +
 | ||||
| +attributes #0 = { nocallback nofree nosync nounwind speculatable willreturn memory(none) }
 | ||||
| -- 
 | ||||
| 2.48.1 | ||||
| 
 | ||||
							
								
								
									
										39
									
								
								0001-cmake-Resolve-symlink-when-finding-install-prefix.patch
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										39
									
								
								0001-cmake-Resolve-symlink-when-finding-install-prefix.patch
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,39 @@ | ||||
| From 06774eb8a7dc0bc36b59e53310c7f5b5d89f6c29 Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Tue, 28 Jan 2025 12:31:49 +0100 | ||||
| Subject: [PATCH] [cmake] Resolve symlink when finding install prefix | ||||
| 
 | ||||
| When determining the install prefix in LLVMConfig.cmake etc resolve | ||||
| symlinks in CMAKE_CURRENT_LIST_FILE first. The motivation for this | ||||
| is to support symlinks like `/usr/lib64/cmake/llvm` to | ||||
| `/usr/lib64/llvm19/lib/cmake/llvm`. This only works correctly if | ||||
| the paths are relative to the resolved symlink. | ||||
| 
 | ||||
| It's worth noting that this *mostly* already works out of the box, | ||||
| because cmake automatically does the symlink resolution when the | ||||
| library is found via CMAKE_PREFIX_PATH. It just doesn't happen | ||||
| when it's found via the default prefix path. | ||||
| ---
 | ||||
|  cmake/Modules/FindPrefixFromConfig.cmake | 4 ++-- | ||||
|  1 file changed, 2 insertions(+), 2 deletions(-) | ||||
| 
 | ||||
| diff --git a/cmake/Modules/FindPrefixFromConfig.cmake b/cmake/Modules/FindPrefixFromConfig.cmake
 | ||||
| index 22211e4b72f2..3daff607ff84 100644
 | ||||
| --- a/cmake/Modules/FindPrefixFromConfig.cmake
 | ||||
| +++ b/cmake/Modules/FindPrefixFromConfig.cmake
 | ||||
| @@ -39,10 +39,10 @@ function(find_prefix_from_config out_var prefix_var path_to_leave)
 | ||||
|      # install prefix, and avoid hard-coding any absolute paths. | ||||
|      set(config_code | ||||
|        "# Compute the installation prefix from this LLVMConfig.cmake file location." | ||||
| -      "get_filename_component(${prefix_var} \"\${CMAKE_CURRENT_LIST_FILE}\" PATH)")
 | ||||
| +      "get_filename_component(${prefix_var} \"\${CMAKE_CURRENT_LIST_FILE}\" REALPATH)")
 | ||||
|      # Construct the proper number of get_filename_component(... PATH) | ||||
|      # calls to compute the installation prefix. | ||||
| -    string(REGEX REPLACE "/" ";" _count "${path_to_leave}")
 | ||||
| +    string(REGEX REPLACE "/" ";" _count "${path_to_leave}/plus_one")
 | ||||
|      foreach(p ${_count}) | ||||
|        list(APPEND config_code | ||||
|          "get_filename_component(${prefix_var} \"\${${prefix_var}}\" PATH)") | ||||
| -- 
 | ||||
| 2.48.1 | ||||
| 
 | ||||
| @ -1,62 +0,0 @@ | ||||
| From b2edeb58b8cb3268acee425cd52b406eb60a8095 Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Wed, 9 Oct 2024 11:29:30 +0200 | ||||
| Subject: [PATCH] [openmp] Add option to disable tsan tests (#111548) | ||||
| 
 | ||||
| This adds a OPENMP_TEST_ENABLE_TSAN option that allows to override | ||||
| whether tests using tsan will be enabled. The option defaults to the | ||||
| existing auto-detection. | ||||
| 
 | ||||
| The background here is | ||||
| https://github.com/llvm/llvm-project/issues/111492, where we have some | ||||
| systems where tsan doesn't work, but we do still want to build it and | ||||
| run tests that don't use tsan. | ||||
| ---
 | ||||
|  openmp/cmake/OpenMPTesting.cmake          | 3 +++ | ||||
|  openmp/tools/archer/tests/CMakeLists.txt  | 2 +- | ||||
|  openmp/tools/archer/tests/lit.site.cfg.in | 2 +- | ||||
|  3 files changed, 5 insertions(+), 2 deletions(-) | ||||
| 
 | ||||
| diff --git a/openmp/cmake/OpenMPTesting.cmake b/openmp/cmake/OpenMPTesting.cmake
 | ||||
| index c67ad8b1cbd9..14cc5c67d84c 100644
 | ||||
| --- a/openmp/cmake/OpenMPTesting.cmake
 | ||||
| +++ b/openmp/cmake/OpenMPTesting.cmake
 | ||||
| @@ -163,6 +163,9 @@ else()
 | ||||
|    set(OPENMP_TEST_COMPILER_HAS_OMIT_FRAME_POINTER_FLAGS 1) | ||||
|  endif() | ||||
|   | ||||
| +set(OPENMP_TEST_ENABLE_TSAN "${OPENMP_TEST_COMPILER_HAS_TSAN_FLAGS}" CACHE BOOL
 | ||||
| +    "Whether to enable tests using tsan")
 | ||||
| +
 | ||||
|  # Function to set compiler features for use in lit. | ||||
|  function(update_test_compiler_features) | ||||
|    set(FEATURES "[") | ||||
| diff --git a/openmp/tools/archer/tests/CMakeLists.txt b/openmp/tools/archer/tests/CMakeLists.txt
 | ||||
| index 5de91148fa4b..412c7d63725e 100644
 | ||||
| --- a/openmp/tools/archer/tests/CMakeLists.txt
 | ||||
| +++ b/openmp/tools/archer/tests/CMakeLists.txt
 | ||||
| @@ -28,7 +28,7 @@ macro(pythonize_bool var)
 | ||||
|  endmacro() | ||||
|   | ||||
|  pythonize_bool(LIBARCHER_HAVE_LIBATOMIC) | ||||
| -pythonize_bool(OPENMP_TEST_COMPILER_HAS_TSAN_FLAGS)
 | ||||
| +pythonize_bool(OPENMP_TEST_ENABLE_TSAN)
 | ||||
|   | ||||
|  set(ARCHER_TSAN_TEST_DEPENDENCE "") | ||||
|  if(TARGET tsan) | ||||
| diff --git a/openmp/tools/archer/tests/lit.site.cfg.in b/openmp/tools/archer/tests/lit.site.cfg.in
 | ||||
| index 55edfde9738e..ddcb7b8bc3a5 100644
 | ||||
| --- a/openmp/tools/archer/tests/lit.site.cfg.in
 | ||||
| +++ b/openmp/tools/archer/tests/lit.site.cfg.in
 | ||||
| @@ -12,7 +12,7 @@ config.omp_library_dir = "@LIBOMP_LIBRARY_DIR@"
 | ||||
|  config.omp_header_dir = "@LIBOMP_INCLUDE_DIR@" | ||||
|  config.operating_system = "@CMAKE_SYSTEM_NAME@" | ||||
|  config.has_libatomic = @LIBARCHER_HAVE_LIBATOMIC@ | ||||
| -config.has_tsan = @OPENMP_TEST_COMPILER_HAS_TSAN_FLAGS@
 | ||||
| +config.has_tsan = @OPENMP_TEST_ENABLE_TSAN@
 | ||||
|   | ||||
|  config.test_archer_flags = "@LIBARCHER_TEST_FLAGS@" | ||||
|  config.libarcher_obj_root = "@CMAKE_CURRENT_BINARY_DIR@" | ||||
| -- 
 | ||||
| 2.46.0 | ||||
| 
 | ||||
| @ -1,51 +0,0 @@ | ||||
| From 90a05f32166c4a45224a5eedbec9c5c7e21d2dbf Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Fri, 17 Jan 2025 09:26:49 +0100 | ||||
| Subject: [PATCH] [openmp] Support CET in z_Linux_asm.S (#123213) | ||||
| 
 | ||||
| When libomp is built with -cf-protection, add endbr instructions to the | ||||
| start of functions for Intel CET support. | ||||
| ---
 | ||||
|  openmp/runtime/src/z_Linux_asm.S | 12 ++++++++++++ | ||||
|  1 file changed, 12 insertions(+) | ||||
| 
 | ||||
| diff --git a/openmp/runtime/src/z_Linux_asm.S b/openmp/runtime/src/z_Linux_asm.S
 | ||||
| index cc5344cdd124..0bf9f07a13f1 100644
 | ||||
| --- a/openmp/runtime/src/z_Linux_asm.S
 | ||||
| +++ b/openmp/runtime/src/z_Linux_asm.S
 | ||||
| @@ -19,6 +19,16 @@
 | ||||
|   | ||||
|  #if KMP_ARCH_X86 || KMP_ARCH_X86_64 | ||||
|   | ||||
| +# if defined(__ELF__) && defined(__CET__) && defined(__has_include)
 | ||||
| +# if __has_include(<cet.h>)
 | ||||
| +# include <cet.h>
 | ||||
| +# endif
 | ||||
| +# endif
 | ||||
| +
 | ||||
| +# if !defined(_CET_ENDBR)
 | ||||
| +# define _CET_ENDBR
 | ||||
| +# endif
 | ||||
| +
 | ||||
|  # if KMP_MIC | ||||
|  // the 'delay r16/r32/r64' should be used instead of the 'pause'. | ||||
|  // The delay operation has the effect of removing the current thread from | ||||
| @@ -66,6 +76,7 @@
 | ||||
|  	ALIGN  4 | ||||
|  	.globl KMP_PREFIX_UNDERSCORE($0) | ||||
|  KMP_PREFIX_UNDERSCORE($0): | ||||
| +	_CET_ENDBR
 | ||||
|  .endmacro | ||||
|  # else // KMP_OS_DARWIN | ||||
|  #  define KMP_PREFIX_UNDERSCORE(x) x //no extra underscore for Linux* OS symbols | ||||
| @@ -92,6 +103,7 @@ KMP_PREFIX_UNDERSCORE($0):
 | ||||
|          .globl KMP_PREFIX_UNDERSCORE(\proc) | ||||
|  KMP_PREFIX_UNDERSCORE(\proc): | ||||
|  	.cfi_startproc | ||||
| +	_CET_ENDBR
 | ||||
|  .endm | ||||
|  .macro KMP_CFI_DEF_OFFSET sz | ||||
|  	.cfi_def_cfa_offset	\sz | ||||
| -- 
 | ||||
| 2.47.1 | ||||
| 
 | ||||
| @ -1,205 +0,0 @@ | ||||
| From 5fb4d7f6079a76b2907ccc8c53c7c509c30a3dca Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Thu, 10 Oct 2024 12:47:33 +0000 | ||||
| Subject: [PATCH] [openmp] Use core_siblings_list if physical_package_id not | ||||
|  available | ||||
| 
 | ||||
| On powerpc, physical_package_id may not be available. Currently, | ||||
| this causes openmp to fall back to flat topology and various | ||||
| affinity tests fail. | ||||
| 
 | ||||
| Fix this by parsing core_siblings_list to deterimine which cpus | ||||
| belong to the same socket. This matches what the testing code | ||||
| does. The code to parse the CPU list format thankfully already | ||||
| exists. | ||||
| 
 | ||||
| Fixes https://github.com/llvm/llvm-project/issues/111809. | ||||
| ---
 | ||||
|  openmp/runtime/src/kmp_affinity.cpp          | 100 +++++++++++++------ | ||||
|  openmp/runtime/test/affinity/kmp-hw-subset.c |   2 +- | ||||
|  2 files changed, 72 insertions(+), 30 deletions(-) | ||||
| 
 | ||||
| diff --git a/openmp/runtime/src/kmp_affinity.cpp b/openmp/runtime/src/kmp_affinity.cpp
 | ||||
| index cf5cad04eb57..c3d5ecf1345e 100644
 | ||||
| --- a/openmp/runtime/src/kmp_affinity.cpp
 | ||||
| +++ b/openmp/runtime/src/kmp_affinity.cpp
 | ||||
| @@ -1589,15 +1589,13 @@ kmp_str_buf_t *__kmp_affinity_str_buf_mask(kmp_str_buf_t *buf,
 | ||||
|    return buf; | ||||
|  } | ||||
|   | ||||
| -// Return (possibly empty) affinity mask representing the offline CPUs
 | ||||
| -// Caller must free the mask
 | ||||
| -kmp_affin_mask_t *__kmp_affinity_get_offline_cpus() {
 | ||||
| -  kmp_affin_mask_t *offline;
 | ||||
| -  KMP_CPU_ALLOC(offline);
 | ||||
| -  KMP_CPU_ZERO(offline);
 | ||||
| +static kmp_affin_mask_t *__kmp_parse_cpu_list(const char *path) {
 | ||||
| +  kmp_affin_mask_t *mask;
 | ||||
| +  KMP_CPU_ALLOC(mask);
 | ||||
| +  KMP_CPU_ZERO(mask);
 | ||||
|  #if KMP_OS_LINUX | ||||
|    int n, begin_cpu, end_cpu; | ||||
| -  kmp_safe_raii_file_t offline_file;
 | ||||
| +  kmp_safe_raii_file_t file;
 | ||||
|    auto skip_ws = [](FILE *f) { | ||||
|      int c; | ||||
|      do { | ||||
| @@ -1606,29 +1604,29 @@ kmp_affin_mask_t *__kmp_affinity_get_offline_cpus() {
 | ||||
|      if (c != EOF) | ||||
|        ungetc(c, f); | ||||
|    }; | ||||
| -  // File contains CSV of integer ranges representing the offline CPUs
 | ||||
| +  // File contains CSV of integer ranges representing the CPUs
 | ||||
|    // e.g., 1,2,4-7,9,11-15 | ||||
| -  int status = offline_file.try_open("/sys/devices/system/cpu/offline", "r");
 | ||||
| +  int status = file.try_open(path, "r");
 | ||||
|    if (status != 0) | ||||
| -    return offline;
 | ||||
| -  while (!feof(offline_file)) {
 | ||||
| -    skip_ws(offline_file);
 | ||||
| -    n = fscanf(offline_file, "%d", &begin_cpu);
 | ||||
| +    return mask;
 | ||||
| +  while (!feof(file)) {
 | ||||
| +    skip_ws(file);
 | ||||
| +    n = fscanf(file, "%d", &begin_cpu);
 | ||||
|      if (n != 1) | ||||
|        break; | ||||
| -    skip_ws(offline_file);
 | ||||
| -    int c = fgetc(offline_file);
 | ||||
| +    skip_ws(file);
 | ||||
| +    int c = fgetc(file);
 | ||||
|      if (c == EOF || c == ',') { | ||||
|        // Just single CPU | ||||
|        end_cpu = begin_cpu; | ||||
|      } else if (c == '-') { | ||||
|        // Range of CPUs | ||||
| -      skip_ws(offline_file);
 | ||||
| -      n = fscanf(offline_file, "%d", &end_cpu);
 | ||||
| +      skip_ws(file);
 | ||||
| +      n = fscanf(file, "%d", &end_cpu);
 | ||||
|        if (n != 1) | ||||
|          break; | ||||
| -      skip_ws(offline_file);
 | ||||
| -      c = fgetc(offline_file); // skip ','
 | ||||
| +      skip_ws(file);
 | ||||
| +      c = fgetc(file); // skip ','
 | ||||
|      } else { | ||||
|        // Syntax problem | ||||
|        break; | ||||
| @@ -1638,13 +1636,19 @@ kmp_affin_mask_t *__kmp_affinity_get_offline_cpus() {
 | ||||
|          end_cpu >= __kmp_xproc || begin_cpu > end_cpu) { | ||||
|        continue; | ||||
|      } | ||||
| -    // Insert [begin_cpu, end_cpu] into offline mask
 | ||||
| +    // Insert [begin_cpu, end_cpu] into mask
 | ||||
|      for (int cpu = begin_cpu; cpu <= end_cpu; ++cpu) { | ||||
| -      KMP_CPU_SET(cpu, offline);
 | ||||
| +      KMP_CPU_SET(cpu, mask);
 | ||||
|      } | ||||
|    } | ||||
|  #endif | ||||
| -  return offline;
 | ||||
| +  return mask;
 | ||||
| +}
 | ||||
| +
 | ||||
| +// Return (possibly empty) affinity mask representing the offline CPUs
 | ||||
| +// Caller must free the mask
 | ||||
| +kmp_affin_mask_t *__kmp_affinity_get_offline_cpus() {
 | ||||
| +  return __kmp_parse_cpu_list("/sys/devices/system/cpu/offline");
 | ||||
|  } | ||||
|   | ||||
|  // Return the number of available procs | ||||
| @@ -3175,6 +3179,37 @@ static inline const char *__kmp_cpuinfo_get_envvar() {
 | ||||
|    return envvar; | ||||
|  } | ||||
|   | ||||
| +static bool __kmp_package_id_from_core_siblings_list(unsigned **threadInfo,
 | ||||
| +                                                     unsigned num_avail,
 | ||||
| +                                                     unsigned idx) {
 | ||||
| +  if (!KMP_AFFINITY_CAPABLE())
 | ||||
| +    return false;
 | ||||
| +
 | ||||
| +  char path[256];
 | ||||
| +  KMP_SNPRINTF(path, sizeof(path),
 | ||||
| +               "/sys/devices/system/cpu/cpu%u/topology/core_siblings_list",
 | ||||
| +               threadInfo[idx][osIdIndex]);
 | ||||
| +  kmp_affin_mask_t *siblings = __kmp_parse_cpu_list(path);
 | ||||
| +  for (unsigned i = 0; i < num_avail; ++i) {
 | ||||
| +    unsigned cpu_id = threadInfo[i][osIdIndex];
 | ||||
| +    KMP_ASSERT(cpu_id < __kmp_affin_mask_size * CHAR_BIT);
 | ||||
| +    if (!KMP_CPU_ISSET(cpu_id, siblings))
 | ||||
| +      continue;
 | ||||
| +    if (threadInfo[i][pkgIdIndex] == UINT_MAX) {
 | ||||
| +      // Arbitrarily pick the first index we encounter, it only matters that
 | ||||
| +      // the value is the same for all siblings.
 | ||||
| +      threadInfo[i][pkgIdIndex] = idx;
 | ||||
| +    } else if (threadInfo[i][pkgIdIndex] != idx) {
 | ||||
| +      // Contradictory sibling lists.
 | ||||
| +      KMP_CPU_FREE(siblings);
 | ||||
| +      return false;
 | ||||
| +    }
 | ||||
| +  }
 | ||||
| +  KMP_ASSERT(threadInfo[idx][pkgIdIndex] != UINT_MAX);
 | ||||
| +  KMP_CPU_FREE(siblings);
 | ||||
| +  return true;
 | ||||
| +}
 | ||||
| +
 | ||||
|  // Parse /proc/cpuinfo (or an alternate file in the same format) to obtain the | ||||
|  // affinity map. On AIX, the map is obtained through system SRAD (Scheduler | ||||
|  // Resource Allocation Domain). | ||||
| @@ -3550,18 +3585,13 @@ static bool __kmp_affinity_create_cpuinfo_map(int *line,
 | ||||
|          return false; | ||||
|        } | ||||
|   | ||||
| -      // Check for missing fields.  The osId field must be there, and we
 | ||||
| -      // currently require that the physical id field is specified, also.
 | ||||
| +      // Check for missing fields.  The osId field must be there. The physical
 | ||||
| +      // id field will be checked later.
 | ||||
|        if (threadInfo[num_avail][osIdIndex] == UINT_MAX) { | ||||
|          CLEANUP_THREAD_INFO; | ||||
|          *msg_id = kmp_i18n_str_MissingProcField; | ||||
|          return false; | ||||
|        } | ||||
| -      if (threadInfo[0][pkgIdIndex] == UINT_MAX) {
 | ||||
| -        CLEANUP_THREAD_INFO;
 | ||||
| -        *msg_id = kmp_i18n_str_MissingPhysicalIDField;
 | ||||
| -        return false;
 | ||||
| -      }
 | ||||
|   | ||||
|        // Skip this proc if it is not included in the machine model. | ||||
|        if (KMP_AFFINITY_CAPABLE() && | ||||
| @@ -3591,6 +3621,18 @@ static bool __kmp_affinity_create_cpuinfo_map(int *line,
 | ||||
|    } | ||||
|    *line = 0; | ||||
|   | ||||
| +  // At least on powerpc, Linux may return -1 for physical_package_id. Try
 | ||||
| +  // to reconstruct topology from core_siblings_list in that case.
 | ||||
| +  for (i = 0; i < num_avail; ++i) {
 | ||||
| +    if (threadInfo[i][pkgIdIndex] == UINT_MAX) {
 | ||||
| +      if (!__kmp_package_id_from_core_siblings_list(threadInfo, num_avail, i)) {
 | ||||
| +        CLEANUP_THREAD_INFO;
 | ||||
| +        *msg_id = kmp_i18n_str_MissingPhysicalIDField;
 | ||||
| +        return false;
 | ||||
| +      }
 | ||||
| +    }
 | ||||
| +  }
 | ||||
| +
 | ||||
|  #if KMP_MIC && REDUCE_TEAM_SIZE | ||||
|    unsigned teamSize = 0; | ||||
|  #endif // KMP_MIC && REDUCE_TEAM_SIZE | ||||
| diff --git a/openmp/runtime/test/affinity/kmp-hw-subset.c b/openmp/runtime/test/affinity/kmp-hw-subset.c
 | ||||
| index 606fcdfbada9..0b49969bd3b1 100644
 | ||||
| --- a/openmp/runtime/test/affinity/kmp-hw-subset.c
 | ||||
| +++ b/openmp/runtime/test/affinity/kmp-hw-subset.c
 | ||||
| @@ -25,7 +25,7 @@ static int compare_hw_subset_places(const place_list_t *openmp_places,
 | ||||
|      expected_per_place = nthreads_per_core; | ||||
|    } else { | ||||
|      expected_total = nsockets; | ||||
| -    expected_per_place = ncores_per_socket;
 | ||||
| +    expected_per_place = ncores_per_socket * nthreads_per_core;
 | ||||
|    } | ||||
|    if (openmp_places->num_places != expected_total) { | ||||
|      fprintf(stderr, "error: KMP_HW_SUBSET did not half each resource layer!\n"); | ||||
| -- 
 | ||||
| 2.47.0 | ||||
| 
 | ||||
| @ -1,86 +0,0 @@ | ||||
| From ccc2b792e57d632bc887b226a4e7f0a8189eab8b Mon Sep 17 00:00:00 2001 | ||||
| From: Josh Stone <jistone@redhat.com> | ||||
| Date: Mon, 4 Nov 2024 16:37:49 -0800 | ||||
| Subject: [PATCH] [profile] Use base+vaddr for `__llvm_write_binary_ids` note | ||||
|  pointers | ||||
| 
 | ||||
| This function is always examining its own ELF headers in memory, but it | ||||
| was trying to use conditions between examining files or memory, and it | ||||
| wasn't accounting for LOAD offsets at runtime. This is especially bad if | ||||
| a loaded segment has additional padding that's not in the file offsets. | ||||
| 
 | ||||
| Now we do a first scan of the program headers to figure out the runtime | ||||
| base address based on `PT_PHDR` and/or `PT_DYNAMIC` (else assume zero), | ||||
| similar to libc's `do_start`. Then each `PT_NOTE` pointer is simply the | ||||
| base plus the segments's `pt_vaddr`, which includes LOAD offsets. | ||||
| 
 | ||||
| Fixes #114605 | ||||
| ---
 | ||||
|  .../lib/profile/InstrProfilingPlatformLinux.c | 40 ++++++++----------- | ||||
|  1 file changed, 16 insertions(+), 24 deletions(-) | ||||
| 
 | ||||
| diff --git a/compiler-rt/lib/profile/InstrProfilingPlatformLinux.c b/compiler-rt/lib/profile/InstrProfilingPlatformLinux.c
 | ||||
| index e2c06d51e0c6..c365129a0768 100644
 | ||||
| --- a/compiler-rt/lib/profile/InstrProfilingPlatformLinux.c
 | ||||
| +++ b/compiler-rt/lib/profile/InstrProfilingPlatformLinux.c
 | ||||
| @@ -194,41 +194,33 @@ static int WriteBinaryIds(ProfDataWriter *Writer, const ElfW(Nhdr) * Note,
 | ||||
|   */ | ||||
|  COMPILER_RT_VISIBILITY int __llvm_write_binary_ids(ProfDataWriter *Writer) { | ||||
|    extern const ElfW(Ehdr) __ehdr_start __attribute__((visibility("hidden"))); | ||||
| +  extern ElfW(Dyn) _DYNAMIC[] __attribute__((weak, visibility("hidden")));
 | ||||
| +
 | ||||
|    const ElfW(Ehdr) *ElfHeader = &__ehdr_start; | ||||
|    const ElfW(Phdr) *ProgramHeader = | ||||
|        (const ElfW(Phdr) *)((uintptr_t)ElfHeader + ElfHeader->e_phoff); | ||||
|   | ||||
| +  /* Compute the added base address in case of position-independent code. */
 | ||||
| +  uintptr_t Base = 0;
 | ||||
| +  for (uint32_t I = 0; I < ElfHeader->e_phnum; I++) {
 | ||||
| +    if (ProgramHeader[I].p_type == PT_PHDR)
 | ||||
| +      Base = (uintptr_t)ProgramHeader - ProgramHeader[I].p_vaddr;
 | ||||
| +    if (ProgramHeader[I].p_type == PT_DYNAMIC && _DYNAMIC)
 | ||||
| +      Base = (uintptr_t)_DYNAMIC - ProgramHeader[I].p_vaddr;
 | ||||
| +  }
 | ||||
| +
 | ||||
|    int TotalBinaryIdsSize = 0; | ||||
| -  uint32_t I;
 | ||||
|    /* Iterate through entries in the program header. */ | ||||
| -  for (I = 0; I < ElfHeader->e_phnum; I++) {
 | ||||
| +  for (uint32_t I = 0; I < ElfHeader->e_phnum; I++) {
 | ||||
|      /* Look for the notes segment in program header entries. */ | ||||
|      if (ProgramHeader[I].p_type != PT_NOTE) | ||||
|        continue; | ||||
|   | ||||
|      /* There can be multiple notes segment, and examine each of them. */ | ||||
| -    const ElfW(Nhdr) * Note;
 | ||||
| -    const ElfW(Nhdr) * NotesEnd;
 | ||||
| -    /*
 | ||||
| -     * When examining notes in file, use p_offset, which is the offset within
 | ||||
| -     * the elf file, to find the start of notes.
 | ||||
| -     */
 | ||||
| -    if (ProgramHeader[I].p_memsz == 0 ||
 | ||||
| -        ProgramHeader[I].p_memsz == ProgramHeader[I].p_filesz) {
 | ||||
| -      Note = (const ElfW(Nhdr) *)((uintptr_t)ElfHeader +
 | ||||
| -                                  ProgramHeader[I].p_offset);
 | ||||
| -      NotesEnd = (const ElfW(Nhdr) *)((const char *)(Note) +
 | ||||
| -                                      ProgramHeader[I].p_filesz);
 | ||||
| -    } else {
 | ||||
| -      /*
 | ||||
| -       * When examining notes in memory, use p_vaddr, which is the address of
 | ||||
| -       * section after loaded to memory, to find the start of notes.
 | ||||
| -       */
 | ||||
| -      Note =
 | ||||
| -          (const ElfW(Nhdr) *)((uintptr_t)ElfHeader + ProgramHeader[I].p_vaddr);
 | ||||
| -      NotesEnd =
 | ||||
| -          (const ElfW(Nhdr) *)((const char *)(Note) + ProgramHeader[I].p_memsz);
 | ||||
| -    }
 | ||||
| +    const ElfW(Nhdr) *Note =
 | ||||
| +        (const ElfW(Nhdr) *)(Base + ProgramHeader[I].p_vaddr);
 | ||||
| +    const ElfW(Nhdr) *NotesEnd =
 | ||||
| +        (const ElfW(Nhdr) *)((const char *)(Note) + ProgramHeader[I].p_memsz);
 | ||||
|   | ||||
|      int BinaryIdsSize = WriteBinaryIds(Writer, Note, NotesEnd); | ||||
|      if (TotalBinaryIdsSize == -1) | ||||
| -- 
 | ||||
| 2.47.0 | ||||
| 
 | ||||
							
								
								
									
										46
									
								
								131801.patch
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										46
									
								
								131801.patch
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,46 @@ | ||||
| From d25887408ee9fb78d68787ff7388cba254aced6f Mon Sep 17 00:00:00 2001 | ||||
| From: Nikita Popov <npopov@redhat.com> | ||||
| Date: Tue, 18 Mar 2025 14:36:06 +0100 | ||||
| Subject: [PATCH] [GlobalMerge][PPC] Don't merge globals in llvm.metadata | ||||
|  section | ||||
| 
 | ||||
| The llvm.metadata section is not emitted and has special semantics. | ||||
| We should not merge globals in it, similarly to how we already | ||||
| skip merging of `llvm.xyz` globals. | ||||
| 
 | ||||
| Fixes https://github.com/llvm/llvm-project/issues/131394. | ||||
| ---
 | ||||
|  llvm/lib/CodeGen/GlobalMerge.cpp                        | 3 ++- | ||||
|  llvm/test/CodeGen/PowerPC/global-merge-llvm-metadata.ll | 9 +++++++++ | ||||
|  2 files changed, 11 insertions(+), 1 deletion(-) | ||||
|  create mode 100644 llvm/test/CodeGen/PowerPC/global-merge-llvm-metadata.ll | ||||
| 
 | ||||
| diff --git a/llvm/lib/CodeGen/GlobalMerge.cpp b/llvm/lib/CodeGen/GlobalMerge.cpp
 | ||||
| index 1aedc447935b7..ca743918cec24 100644
 | ||||
| --- a/llvm/lib/CodeGen/GlobalMerge.cpp
 | ||||
| +++ b/llvm/lib/CodeGen/GlobalMerge.cpp
 | ||||
| @@ -711,7 +711,8 @@ bool GlobalMergeImpl::run(Module &M) {
 | ||||
|        continue; | ||||
|   | ||||
|      // Ignore all 'special' globals. | ||||
| -    if (GV.getName().starts_with("llvm.") || GV.getName().starts_with(".llvm."))
 | ||||
| +    if (GV.getName().starts_with("llvm.") ||
 | ||||
| +        GV.getName().starts_with(".llvm.") || Section == "llvm.metadata")
 | ||||
|        continue; | ||||
|   | ||||
|      // Ignore all "required" globals: | ||||
| diff --git a/llvm/test/CodeGen/PowerPC/global-merge-llvm-metadata.ll b/llvm/test/CodeGen/PowerPC/global-merge-llvm-metadata.ll
 | ||||
| new file mode 100644 | ||||
| index 0000000000000..7db092e13afeb
 | ||||
| --- /dev/null
 | ||||
| +++ b/llvm/test/CodeGen/PowerPC/global-merge-llvm-metadata.ll
 | ||||
| @@ -0,0 +1,9 @@
 | ||||
| +; RUN: llc -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s
 | ||||
| +
 | ||||
| +@index = global i32 0, align 4
 | ||||
| +@.str = private unnamed_addr constant [1 x i8] zeroinitializer, section "llvm.metadata"
 | ||||
| +@.str.1 = private unnamed_addr constant [7 x i8] c"test.c\00", section "llvm.metadata" 
 | ||||
| +@llvm.global.annotations = appending global [1 x { ptr, ptr, ptr, i32, ptr }] [{ ptr, ptr, ptr, i32, ptr } { ptr @index, ptr @.str, ptr @.str.1, i32 1, ptr null }], section "llvm.metadata"
 | ||||
| +
 | ||||
| +; CHECK-NOT: .set
 | ||||
| +; CHECK-NOT: _MergedGlobals
 | ||||
							
								
								
									
										893
									
								
								18-99273.patch
									
									
									
									
									
								
							
							
						
						
									
										893
									
								
								18-99273.patch
									
									
									
									
									
								
							| @ -1,893 +0,0 @@ | ||||
| From 91052169960477fbc39169c10f9fae3bec732510 Mon Sep 17 00:00:00 2001 | ||||
| From: Carl Ritson <carl.ritson@amd.com> | ||||
| Date: Wed, 17 Jul 2024 15:07:42 +0900 | ||||
| Subject: [PATCH 1/3] [AMDGPU] Implement workaround for GFX11.5 export priority | ||||
| 
 | ||||
| On GFX11.5 shaders having completed exports need to execute/wait | ||||
| at a lower priority than shaders still executing exports. | ||||
| Add code to maintain normal priority of 2 for shaders that export | ||||
| and drop to priority 0 after exports. | ||||
| ---
 | ||||
|  llvm/lib/Target/AMDGPU/AMDGPU.td              |  15 +- | ||||
|  .../lib/Target/AMDGPU/GCNHazardRecognizer.cpp | 112 ++++++ | ||||
|  llvm/lib/Target/AMDGPU/GCNHazardRecognizer.h  |   1 + | ||||
|  llvm/lib/Target/AMDGPU/GCNSubtarget.h         |   3 + | ||||
|  .../AMDGPU/required-export-priority.ll        | 344 ++++++++++++++++++ | ||||
|  .../AMDGPU/required-export-priority.mir       | 293 +++++++++++++++ | ||||
|  6 files changed, 765 insertions(+), 3 deletions(-) | ||||
|  create mode 100644 llvm/test/CodeGen/AMDGPU/required-export-priority.ll | ||||
|  create mode 100644 llvm/test/CodeGen/AMDGPU/required-export-priority.mir | ||||
| 
 | ||||
| diff --git a/llvm/lib/Target/AMDGPU/AMDGPU.td b/llvm/lib/Target/AMDGPU/AMDGPU.td
 | ||||
| index dfc8eaea66f7b..14fcf6a210a78 100644
 | ||||
| --- a/llvm/lib/Target/AMDGPU/AMDGPU.td
 | ||||
| +++ b/llvm/lib/Target/AMDGPU/AMDGPU.td
 | ||||
| @@ -947,6 +947,12 @@ def FeatureHasRestrictedSOffset : SubtargetFeature<"restricted-soffset",
 | ||||
|    "Has restricted SOffset (immediate not supported)." | ||||
|  >; | ||||
|   | ||||
| +def FeatureRequiredExportPriority : SubtargetFeature<"required-export-priority",
 | ||||
| +  "HasRequiredExportPriority",
 | ||||
| +  "true",
 | ||||
| +  "Export priority must be explicitly manipulated on GFX11.5"
 | ||||
| +>;
 | ||||
| +
 | ||||
|  //===------------------------------------------------------------===// | ||||
|  // Subtarget Features (options and debugging) | ||||
|  //===------------------------------------------------------------===// | ||||
| @@ -1597,14 +1603,16 @@ def FeatureISAVersion11_5_0 : FeatureSet<
 | ||||
|    !listconcat(FeatureISAVersion11_Common.Features, | ||||
|      [FeatureSALUFloatInsts, | ||||
|       FeatureDPPSrc1SGPR, | ||||
| -     FeatureVGPRSingleUseHintInsts])>;
 | ||||
| +     FeatureVGPRSingleUseHintInsts,
 | ||||
| +     FeatureRequiredExportPriority])>;
 | ||||
|   | ||||
|  def FeatureISAVersion11_5_1 : FeatureSet< | ||||
|    !listconcat(FeatureISAVersion11_Common.Features, | ||||
|      [FeatureSALUFloatInsts, | ||||
|       FeatureDPPSrc1SGPR, | ||||
|       FeatureVGPRSingleUseHintInsts, | ||||
| -     FeatureGFX11FullVGPRs])>;
 | ||||
| +     FeatureGFX11FullVGPRs,
 | ||||
| +     FeatureRequiredExportPriority])>;
 | ||||
|   | ||||
|  def FeatureISAVersion12 : FeatureSet< | ||||
|    [FeatureGFX12, | ||||
| diff --git a/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.cpp b/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.cpp
 | ||||
| index a402fc6d7e611..a8b171aa82840 100644
 | ||||
| --- a/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.cpp
 | ||||
| +++ b/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.cpp
 | ||||
| @@ -14,6 +14,7 @@
 | ||||
|  #include "GCNSubtarget.h" | ||||
|  #include "MCTargetDesc/AMDGPUMCTargetDesc.h" | ||||
|  #include "SIMachineFunctionInfo.h" | ||||
| +#include "llvm/CodeGen/MachineFrameInfo.h"
 | ||||
|  #include "llvm/CodeGen/MachineFunction.h" | ||||
|  #include "llvm/CodeGen/ScheduleDAG.h" | ||||
|  #include "llvm/TargetParser/TargetParser.h" | ||||
| @@ -1104,6 +1105,7 @@ void GCNHazardRecognizer::fixHazards(MachineInstr *MI) {
 | ||||
|    fixWMMAHazards(MI); | ||||
|    fixShift64HighRegBug(MI); | ||||
|    fixVALUMaskWriteHazard(MI); | ||||
| +  fixRequiredExportPriority(MI);
 | ||||
|  } | ||||
|   | ||||
|  bool GCNHazardRecognizer::fixVcmpxPermlaneHazards(MachineInstr *MI) { | ||||
| @@ -2895,3 +2897,113 @@ bool GCNHazardRecognizer::fixVALUMaskWriteHazard(MachineInstr *MI) {
 | ||||
|   | ||||
|    return true; | ||||
|  } | ||||
| +
 | ||||
| +static bool ensureEntrySetPrio(MachineFunction *MF, int Priority,
 | ||||
| +                               const SIInstrInfo &TII) {
 | ||||
| +  MachineBasicBlock &EntryMBB = MF->front();
 | ||||
| +  if (EntryMBB.begin() != EntryMBB.end()) {
 | ||||
| +    auto &EntryMI = *EntryMBB.begin();
 | ||||
| +    if (EntryMI.getOpcode() == AMDGPU::S_SETPRIO &&
 | ||||
| +        EntryMI.getOperand(0).getImm() >= Priority)
 | ||||
| +      return false;
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  BuildMI(EntryMBB, EntryMBB.begin(), DebugLoc(), TII.get(AMDGPU::S_SETPRIO))
 | ||||
| +      .addImm(Priority);
 | ||||
| +  return true;
 | ||||
| +}
 | ||||
| +
 | ||||
| +bool GCNHazardRecognizer::fixRequiredExportPriority(MachineInstr *MI) {
 | ||||
| +  if (!ST.hasRequiredExportPriority())
 | ||||
| +    return false;
 | ||||
| +
 | ||||
| +  // Assume the following shader types will never have exports,
 | ||||
| +  // and avoid adding or adjusting S_SETPRIO.
 | ||||
| +  MachineBasicBlock *MBB = MI->getParent();
 | ||||
| +  MachineFunction *MF = MBB->getParent();
 | ||||
| +  auto CC = MF->getFunction().getCallingConv();
 | ||||
| +  switch (CC) {
 | ||||
| +  case CallingConv::AMDGPU_CS:
 | ||||
| +  case CallingConv::AMDGPU_CS_Chain:
 | ||||
| +  case CallingConv::AMDGPU_CS_ChainPreserve:
 | ||||
| +  case CallingConv::AMDGPU_KERNEL:
 | ||||
| +    return false;
 | ||||
| +  default:
 | ||||
| +    break;
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  const int MaxPriority = 3;
 | ||||
| +  const int NormalPriority = 2;
 | ||||
| +  const int PostExportPriority = 0;
 | ||||
| +
 | ||||
| +  auto It = MI->getIterator();
 | ||||
| +  switch (MI->getOpcode()) {
 | ||||
| +  case AMDGPU::S_ENDPGM:
 | ||||
| +  case AMDGPU::S_ENDPGM_SAVED:
 | ||||
| +  case AMDGPU::S_ENDPGM_ORDERED_PS_DONE:
 | ||||
| +  case AMDGPU::SI_RETURN_TO_EPILOG:
 | ||||
| +    // Ensure shader with calls raises priority at entry.
 | ||||
| +    // This ensures correct priority if exports exist in callee.
 | ||||
| +    if (MF->getFrameInfo().hasCalls())
 | ||||
| +      return ensureEntrySetPrio(MF, NormalPriority, TII);
 | ||||
| +    return false;
 | ||||
| +  case AMDGPU::S_SETPRIO: {
 | ||||
| +    // Raise minimum priority unless in workaround.
 | ||||
| +    auto &PrioOp = MI->getOperand(0);
 | ||||
| +    int Prio = PrioOp.getImm();
 | ||||
| +    bool InWA = (Prio == PostExportPriority) &&
 | ||||
| +                (It != MBB->begin() && TII.isEXP(*std::prev(It)));
 | ||||
| +    if (InWA || Prio >= NormalPriority)
 | ||||
| +      return false;
 | ||||
| +    PrioOp.setImm(std::min(Prio + NormalPriority, MaxPriority));
 | ||||
| +    return true;
 | ||||
| +  }
 | ||||
| +  default:
 | ||||
| +    if (!TII.isEXP(*MI))
 | ||||
| +      return false;
 | ||||
| +    break;
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  // Check entry priority at each export (as there will only be a few).
 | ||||
| +  // Note: amdgpu_gfx can only be a callee, so defer to caller setprio.
 | ||||
| +  bool Changed = false;
 | ||||
| +  if (CC != CallingConv::AMDGPU_Gfx)
 | ||||
| +    Changed = ensureEntrySetPrio(MF, NormalPriority, TII);
 | ||||
| +
 | ||||
| +  auto NextMI = std::next(It);
 | ||||
| +  bool EndOfShader = false;
 | ||||
| +  if (NextMI != MBB->end()) {
 | ||||
| +    // Only need WA at end of sequence of exports.
 | ||||
| +    if (TII.isEXP(*NextMI))
 | ||||
| +      return Changed;
 | ||||
| +    // Assume appropriate S_SETPRIO after export means WA already applied.
 | ||||
| +    if (NextMI->getOpcode() == AMDGPU::S_SETPRIO &&
 | ||||
| +        NextMI->getOperand(0).getImm() == PostExportPriority)
 | ||||
| +      return Changed;
 | ||||
| +    EndOfShader = NextMI->getOpcode() == AMDGPU::S_ENDPGM;
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  const DebugLoc &DL = MI->getDebugLoc();
 | ||||
| +
 | ||||
| +  // Lower priority.
 | ||||
| +  BuildMI(*MBB, NextMI, DL, TII.get(AMDGPU::S_SETPRIO))
 | ||||
| +      .addImm(PostExportPriority);
 | ||||
| +
 | ||||
| +  if (!EndOfShader) {
 | ||||
| +    // Wait for exports to complete.
 | ||||
| +    BuildMI(*MBB, NextMI, DL, TII.get(AMDGPU::S_WAITCNT_EXPCNT))
 | ||||
| +        .addReg(AMDGPU::SGPR_NULL)
 | ||||
| +        .addImm(0);
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  BuildMI(*MBB, NextMI, DL, TII.get(AMDGPU::S_NOP)).addImm(0);
 | ||||
| +  BuildMI(*MBB, NextMI, DL, TII.get(AMDGPU::S_NOP)).addImm(0);
 | ||||
| +
 | ||||
| +  if (!EndOfShader) {
 | ||||
| +    // Return to normal (higher) priority.
 | ||||
| +    BuildMI(*MBB, NextMI, DL, TII.get(AMDGPU::S_SETPRIO))
 | ||||
| +        .addImm(NormalPriority);
 | ||||
| +  }
 | ||||
| +
 | ||||
| +  return true;
 | ||||
| +}
 | ||||
| diff --git a/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.h b/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.h
 | ||||
| index 3ccca527c626b..f2a64ab48e180 100644
 | ||||
| --- a/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.h
 | ||||
| +++ b/llvm/lib/Target/AMDGPU/GCNHazardRecognizer.h
 | ||||
| @@ -107,6 +107,7 @@ class GCNHazardRecognizer final : public ScheduleHazardRecognizer {
 | ||||
|    bool fixWMMAHazards(MachineInstr *MI); | ||||
|    bool fixShift64HighRegBug(MachineInstr *MI); | ||||
|    bool fixVALUMaskWriteHazard(MachineInstr *MI); | ||||
| +  bool fixRequiredExportPriority(MachineInstr *MI);
 | ||||
|   | ||||
|    int checkMAIHazards(MachineInstr *MI); | ||||
|    int checkMAIHazards908(MachineInstr *MI); | ||||
| diff --git a/llvm/lib/Target/AMDGPU/GCNSubtarget.h b/llvm/lib/Target/AMDGPU/GCNSubtarget.h
 | ||||
| index e5817594a4521..def89c785b855 100644
 | ||||
| --- a/llvm/lib/Target/AMDGPU/GCNSubtarget.h
 | ||||
| +++ b/llvm/lib/Target/AMDGPU/GCNSubtarget.h
 | ||||
| @@ -238,6 +238,7 @@ class GCNSubtarget final : public AMDGPUGenSubtargetInfo,
 | ||||
|    bool HasVOPDInsts = false; | ||||
|    bool HasVALUTransUseHazard = false; | ||||
|    bool HasForceStoreSC0SC1 = false; | ||||
| +  bool HasRequiredExportPriority = false;
 | ||||
|   | ||||
|    // Dummy feature to use for assembler in tablegen. | ||||
|    bool FeatureDisable = false; | ||||
| @@ -1282,6 +1283,8 @@ class GCNSubtarget final : public AMDGPUGenSubtargetInfo,
 | ||||
|   | ||||
|    bool hasRestrictedSOffset() const { return HasRestrictedSOffset; } | ||||
|   | ||||
| +  bool hasRequiredExportPriority() const { return HasRequiredExportPriority; }
 | ||||
| +
 | ||||
|    /// \returns true if the target uses LOADcnt/SAMPLEcnt/BVHcnt, DScnt/KMcnt | ||||
|    /// and STOREcnt rather than VMcnt, LGKMcnt and VScnt respectively. | ||||
|    bool hasExtendedWaitCounts() const { return getGeneration() >= GFX12; } | ||||
| diff --git a/llvm/test/CodeGen/AMDGPU/required-export-priority.ll b/llvm/test/CodeGen/AMDGPU/required-export-priority.ll
 | ||||
| new file mode 100644 | ||||
| index 0000000000000..377902f3f0d1a
 | ||||
| --- /dev/null
 | ||||
| +++ b/llvm/test/CodeGen/AMDGPU/required-export-priority.ll
 | ||||
| @@ -0,0 +1,344 @@
 | ||||
| +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
 | ||||
| +; RUN: llc -mtriple=amdgcn -mcpu=gfx1150 -amdgpu-enable-vopd=0 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_zeroes_f32() #0 {
 | ||||
| +; GCN-LABEL: test_export_zeroes_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, off, off, off
 | ||||
| +; GCN-NEXT:    exp mrt0 off, off, off, off done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 0, float 0.0, float 0.0, float 0.0, float 0.0, i1 false, i1 false)
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 0, float 0.0, float 0.0, float 0.0, float 0.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_en_src0_f32() #0 {
 | ||||
| +; GCN-LABEL: test_export_en_src0_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 2.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 1.0
 | ||||
| +; GCN-NEXT:    exp mrt0 v3, off, off, off done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 1, float 1.0, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_gs void @test_export_gs() #0 {
 | ||||
| +; GCN-LABEL: test_export_gs:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 2.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 1.0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, v2, off, off done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 2, float 1.0, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_hs void @test_export_hs() #0 {
 | ||||
| +; GCN-LABEL: test_export_hs:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 2.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 1.0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, v2, off, off done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 2, float 1.0, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_gfx void @test_export_gfx(float %v) #0 {
 | ||||
| +; GCN-LABEL: test_export_gfx:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 2.0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, v3, off, off done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_waitcnt expcnt(0)
 | ||||
| +; GCN-NEXT:    s_setpc_b64 s[30:31]
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 2, float %v, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_cs void @test_export_cs() #0 {
 | ||||
| +; GCN-LABEL: test_export_cs:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 2.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 1.0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, v2, off, off done
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 2, float 1.0, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_kernel void @test_export_kernel() #0 {
 | ||||
| +; GCN-LABEL: test_export_kernel:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v0, 4.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0.5
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 2.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 1.0
 | ||||
| +; GCN-NEXT:    exp mrt0 off, v2, off, off done
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 2, float 1.0, float 2.0, float 0.5, float 4.0, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_gfx void @test_no_export_gfx(float %v) #0 {
 | ||||
| +; GCN-LABEL: test_no_export_gfx:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
 | ||||
| +; GCN-NEXT:    s_setpc_b64 s[30:31]
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_no_export_ps(float %v) #0 {
 | ||||
| +; GCN-LABEL: test_no_export_ps:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_if_export_f32(i32 %flag, float %x, float %y, float %z, float %w) #0 {
 | ||||
| +; GCN-LABEL: test_if_export_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_mov_b32 s0, exec_lo
 | ||||
| +; GCN-NEXT:    v_cmpx_ne_u32_e32 0, v0
 | ||||
| +; GCN-NEXT:    s_cbranch_execz .LBB9_2
 | ||||
| +; GCN-NEXT:  ; %bb.1: ; %exp
 | ||||
| +; GCN-NEXT:    exp mrt0 v1, v2, v3, v4
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:  .LBB9_2: ; %end
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %cc = icmp eq i32 %flag, 0
 | ||||
| +  br i1 %cc, label %end, label %exp
 | ||||
| +
 | ||||
| +exp:
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 15, float %x, float %y, float %z, float %w, i1 false, i1 false)
 | ||||
| +  br label %end
 | ||||
| +
 | ||||
| +end:
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_if_export_vm_f32(i32 %flag, float %x, float %y, float %z, float %w) #0 {
 | ||||
| +; GCN-LABEL: test_if_export_vm_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_mov_b32 s0, exec_lo
 | ||||
| +; GCN-NEXT:    v_cmpx_ne_u32_e32 0, v0
 | ||||
| +; GCN-NEXT:    s_cbranch_execz .LBB10_2
 | ||||
| +; GCN-NEXT:  ; %bb.1: ; %exp
 | ||||
| +; GCN-NEXT:    exp mrt0 v1, v2, v3, v4
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:  .LBB10_2: ; %end
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %cc = icmp eq i32 %flag, 0
 | ||||
| +  br i1 %cc, label %end, label %exp
 | ||||
| +
 | ||||
| +exp:
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 15, float %x, float %y, float %z, float %w, i1 false, i1 true)
 | ||||
| +  br label %end
 | ||||
| +
 | ||||
| +end:
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_if_export_done_f32(i32 %flag, float %x, float %y, float %z, float %w) #0 {
 | ||||
| +; GCN-LABEL: test_if_export_done_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_mov_b32 s0, exec_lo
 | ||||
| +; GCN-NEXT:    v_cmpx_ne_u32_e32 0, v0
 | ||||
| +; GCN-NEXT:    s_cbranch_execz .LBB11_2
 | ||||
| +; GCN-NEXT:  ; %bb.1: ; %exp
 | ||||
| +; GCN-NEXT:    exp mrt0 v1, v2, v3, v4 done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:  .LBB11_2: ; %end
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %cc = icmp eq i32 %flag, 0
 | ||||
| +  br i1 %cc, label %end, label %exp
 | ||||
| +
 | ||||
| +exp:
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 15, float %x, float %y, float %z, float %w, i1 true, i1 false)
 | ||||
| +  br label %end
 | ||||
| +
 | ||||
| +end:
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_if_export_vm_done_f32(i32 %flag, float %x, float %y, float %z, float %w) #0 {
 | ||||
| +; GCN-LABEL: test_if_export_vm_done_f32:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_mov_b32 s0, exec_lo
 | ||||
| +; GCN-NEXT:    v_cmpx_ne_u32_e32 0, v0
 | ||||
| +; GCN-NEXT:    s_cbranch_execz .LBB12_2
 | ||||
| +; GCN-NEXT:  ; %bb.1: ; %exp
 | ||||
| +; GCN-NEXT:    exp mrt0 v1, v2, v3, v4 done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:  .LBB12_2: ; %end
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %cc = icmp eq i32 %flag, 0
 | ||||
| +  br i1 %cc, label %end, label %exp
 | ||||
| +
 | ||||
| +exp:
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 0, i32 15, float %x, float %y, float %z, float %w, i1 true, i1 true)
 | ||||
| +  br label %end
 | ||||
| +
 | ||||
| +end:
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_pos_before_param_across_load(i32 %idx) #0 {
 | ||||
| +; GCN-LABEL: test_export_pos_before_param_across_load:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    buffer_load_b32 v0, v0, s[0:3], 0 offen
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 1.0
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v3, 0.5
 | ||||
| +; GCN-NEXT:    s_waitcnt vmcnt(0)
 | ||||
| +; GCN-NEXT:    exp pos0 v1, v1, v1, v0 done
 | ||||
| +; GCN-NEXT:    exp invalid_target_32 v2, v2, v2, v2
 | ||||
| +; GCN-NEXT:    exp invalid_target_33 v2, v2, v2, v3
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 32, i32 15, float 1.0, float 1.0, float 1.0, float 1.0, i1 false, i1 false)
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 33, i32 15, float 1.0, float 1.0, float 1.0, float 0.5, i1 false, i1 false)
 | ||||
| +  %load = call float @llvm.amdgcn.raw.ptr.buffer.load.f32(ptr addrspace(8) undef, i32 %idx, i32 0, i32 0)
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 12, i32 15, float 0.0, float 0.0, float 0.0, float %load, i1 true, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_across_store_load(i32 %idx, float %v) #0 {
 | ||||
| +; GCN-LABEL: test_export_across_store_load:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 24
 | ||||
| +; GCN-NEXT:    v_cmp_eq_u32_e32 vcc_lo, 1, v0
 | ||||
| +; GCN-NEXT:    s_delay_alu instid0(VALU_DEP_2)
 | ||||
| +; GCN-NEXT:    v_cndmask_b32_e64 v0, v2, 8, vcc_lo
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v2, 0
 | ||||
| +; GCN-NEXT:    scratch_store_b32 v0, v1, off
 | ||||
| +; GCN-NEXT:    scratch_load_b32 v0, off, off
 | ||||
| +; GCN-NEXT:    v_mov_b32_e32 v1, 1.0
 | ||||
| +; GCN-NEXT:    exp pos0 v2, v2, v2, v1 done
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_waitcnt_expcnt null, 0x0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_waitcnt vmcnt(0)
 | ||||
| +; GCN-NEXT:    exp invalid_target_32 v0, v2, v1, v2
 | ||||
| +; GCN-NEXT:    exp invalid_target_33 v0, v2, v1, v2
 | ||||
| +; GCN-NEXT:    s_setprio 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_nop 0
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %data0 = alloca <4 x float>, align 8, addrspace(5)
 | ||||
| +  %data1 = alloca <4 x float>, align 8, addrspace(5)
 | ||||
| +  %cmp = icmp eq i32 %idx, 1
 | ||||
| +  %data = select i1 %cmp, ptr addrspace(5) %data0, ptr addrspace(5) %data1
 | ||||
| +  store float %v, ptr addrspace(5) %data, align 8
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 12, i32 15, float 0.0, float 0.0, float 0.0, float 1.0, i1 true, i1 false)
 | ||||
| +  %load0 = load float, ptr addrspace(5) %data0, align 8
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 32, i32 15, float %load0, float 0.0, float 1.0, float 0.0, i1 false, i1 false)
 | ||||
| +  call void @llvm.amdgcn.exp.f32(i32 33, i32 15, float %load0, float 0.0, float 1.0, float 0.0, i1 false, i1 false)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_in_callee(float %v) #0 {
 | ||||
| +; GCN-LABEL: test_export_in_callee:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_getpc_b64 s[0:1]
 | ||||
| +; GCN-NEXT:    s_add_u32 s0, s0, test_export_gfx@gotpcrel32@lo+4
 | ||||
| +; GCN-NEXT:    s_addc_u32 s1, s1, test_export_gfx@gotpcrel32@hi+12
 | ||||
| +; GCN-NEXT:    v_add_f32_e32 v0, 1.0, v0
 | ||||
| +; GCN-NEXT:    s_load_b64 s[0:1], s[0:1], 0x0
 | ||||
| +; GCN-NEXT:    s_mov_b32 s32, 0
 | ||||
| +; GCN-NEXT:    s_waitcnt lgkmcnt(0)
 | ||||
| +; GCN-NEXT:    s_swappc_b64 s[30:31], s[0:1]
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %x = fadd float %v, 1.0
 | ||||
| +  call void @test_export_gfx(float %x)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +define amdgpu_ps void @test_export_in_callee_prio(float %v) #0 {
 | ||||
| +; GCN-LABEL: test_export_in_callee_prio:
 | ||||
| +; GCN:       ; %bb.0:
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_mov_b32 s32, 0
 | ||||
| +; GCN-NEXT:    v_add_f32_e32 v0, 1.0, v0
 | ||||
| +; GCN-NEXT:    s_setprio 2
 | ||||
| +; GCN-NEXT:    s_getpc_b64 s[0:1]
 | ||||
| +; GCN-NEXT:    s_add_u32 s0, s0, test_export_gfx@gotpcrel32@lo+4
 | ||||
| +; GCN-NEXT:    s_addc_u32 s1, s1, test_export_gfx@gotpcrel32@hi+12
 | ||||
| +; GCN-NEXT:    s_load_b64 s[0:1], s[0:1], 0x0
 | ||||
| +; GCN-NEXT:    s_waitcnt lgkmcnt(0)
 | ||||
| +; GCN-NEXT:    s_swappc_b64 s[30:31], s[0:1]
 | ||||
| +; GCN-NEXT:    s_endpgm
 | ||||
| +  %x = fadd float %v, 1.0
 | ||||
| +  call void @llvm.amdgcn.s.setprio(i16 0)
 | ||||
| +  call void @test_export_gfx(float %x)
 | ||||
| +  ret void
 | ||||
| +}
 | ||||
| +
 | ||||
| +declare void @llvm.amdgcn.exp.f32(i32, i32, float, float, float, float, i1, i1) #1
 | ||||
| +declare void @llvm.amdgcn.exp.i32(i32, i32, i32, i32, i32, i32, i1, i1) #1
 | ||||
| +declare float @llvm.amdgcn.raw.ptr.buffer.load.f32(ptr addrspace(8), i32, i32, i32) #2
 | ||||
| +declare void @llvm.amdgcn.s.setprio(i16)
 | ||||
| +
 | ||||
| +attributes #0 = { nounwind }
 | ||||
| +attributes #1 = { nounwind inaccessiblememonly }
 | ||||
| +attributes #2 = { nounwind readnone }
 | ||||
| diff --git a/llvm/test/CodeGen/AMDGPU/required-export-priority.mir b/llvm/test/CodeGen/AMDGPU/required-export-priority.mir
 | ||||
| new file mode 100644 | ||||
| index 0000000000000..eee04468036e5
 | ||||
| --- /dev/null
 | ||||
| +++ b/llvm/test/CodeGen/AMDGPU/required-export-priority.mir
 | ||||
| @@ -0,0 +1,293 @@
 | ||||
| +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 5
 | ||||
| +# RUN: llc -mtriple=amdgcn -mcpu=gfx1150 -mattr=-wavefrontsize32,+wavefrontsize64 -run-pass=post-RA-hazard-rec -verify-machineinstrs  %s -o - | FileCheck -check-prefixes=GFX1150 %s
 | ||||
| +
 | ||||
| +--- |
 | ||||
| +  define amdgpu_ps void @end_of_shader() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @end_of_shader_return_to_epilogue() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @end_of_block() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @start_of_block() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @block_of_exports() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @sparse_exports() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @existing_setprio_1() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +  define amdgpu_ps void @existing_setprio_2() {
 | ||||
| +    ret void
 | ||||
| +  }
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: end_of_shader
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    ; GFX1150-LABEL: name: end_of_shader
 | ||||
| +    ; GFX1150: liveins: $vgpr0
 | ||||
| +    ; GFX1150-NEXT: {{  $}}
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_ENDPGM 0
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: end_of_shader_return_to_epilogue
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    ; GFX1150-LABEL: name: end_of_shader_return_to_epilogue
 | ||||
| +    ; GFX1150: liveins: $vgpr0
 | ||||
| +    ; GFX1150-NEXT: {{  $}}
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: SI_RETURN_TO_EPILOG $vgpr0
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    SI_RETURN_TO_EPILOG $vgpr0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: end_of_block
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  ; GFX1150-LABEL: name: end_of_block
 | ||||
| +  ; GFX1150: bb.0:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.1(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT:   EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 0
 | ||||
| +  ; GFX1150-NEXT:   S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.1:
 | ||||
| +  ; GFX1150-NEXT:   S_ENDPGM 0
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +
 | ||||
| +  bb.1:
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: start_of_block
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  ; GFX1150-LABEL: name: start_of_block
 | ||||
| +  ; GFX1150: bb.0:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.1(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.1:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.2(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 0
 | ||||
| +  ; GFX1150-NEXT:   S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.2:
 | ||||
| +  ; GFX1150-NEXT:   S_ENDPGM 0
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +
 | ||||
| +  bb.1:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +
 | ||||
| +  bb.2:
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: block_of_exports
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    ; GFX1150-LABEL: name: block_of_exports
 | ||||
| +    ; GFX1150: liveins: $vgpr0
 | ||||
| +    ; GFX1150-NEXT: {{  $}}
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: EXP 2, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_ENDPGM 0
 | ||||
| +    EXP 2, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: sparse_exports
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    ; GFX1150-LABEL: name: sparse_exports
 | ||||
| +    ; GFX1150: liveins: $vgpr0
 | ||||
| +    ; GFX1150-NEXT: {{  $}}
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: EXP 2, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: $vgpr0 = V_AND_B32_e32 1, $vgpr0, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: $vgpr0 = V_OR_B32_e32 2, $vgpr0, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_ENDPGM 0
 | ||||
| +    EXP 2, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    $vgpr0 = V_AND_B32_e32 1, $vgpr0, implicit $exec
 | ||||
| +    EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    $vgpr0 = V_OR_B32_e32 2, $vgpr0, implicit $exec
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: existing_setprio_1
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  ; GFX1150-LABEL: name: existing_setprio_1
 | ||||
| +  ; GFX1150: bb.0:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.1(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT:   $vgpr0 = V_AND_B32_e32 1, $vgpr0, implicit $exec
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.1:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.2(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 3
 | ||||
| +  ; GFX1150-NEXT:   $vgpr0 = V_OR_B32_e32 2, $vgpr0, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.2:
 | ||||
| +  ; GFX1150-NEXT:   successors: %bb.3(0x80000000)
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 3
 | ||||
| +  ; GFX1150-NEXT:   $vgpr0 = V_OR_B32_e32 3, $vgpr0, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 2
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT: bb.3:
 | ||||
| +  ; GFX1150-NEXT:   liveins: $vgpr0
 | ||||
| +  ; GFX1150-NEXT: {{  $}}
 | ||||
| +  ; GFX1150-NEXT:   EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +  ; GFX1150-NEXT:   S_SETPRIO 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_NOP 0
 | ||||
| +  ; GFX1150-NEXT:   S_ENDPGM 0
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    $vgpr0 = V_AND_B32_e32 1, $vgpr0, implicit $exec
 | ||||
| +
 | ||||
| +  bb.1:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    S_SETPRIO 3
 | ||||
| +    $vgpr0 = V_OR_B32_e32 2, $vgpr0, implicit $exec
 | ||||
| +    S_SETPRIO 0
 | ||||
| +
 | ||||
| +  bb.2:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    S_SETPRIO 1
 | ||||
| +    $vgpr0 = V_OR_B32_e32 3, $vgpr0, implicit $exec
 | ||||
| +    S_SETPRIO 0
 | ||||
| +
 | ||||
| +  bb.3:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| +
 | ||||
| +---
 | ||||
| +name: existing_setprio_2
 | ||||
| +tracksRegLiveness: true
 | ||||
| +liveins:
 | ||||
| +  - { reg: '$vgpr0' }
 | ||||
| +body: |
 | ||||
| +  bb.0:
 | ||||
| +    liveins: $vgpr0
 | ||||
| +    ; GFX1150-LABEL: name: existing_setprio_2
 | ||||
| +    ; GFX1150: liveins: $vgpr0
 | ||||
| +    ; GFX1150-NEXT: {{  $}}
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 3
 | ||||
| +    ; GFX1150-NEXT: EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 0
 | ||||
| +    ; GFX1150-NEXT: S_WAITCNT_EXPCNT $sgpr_null, 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_NOP 0
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 2
 | ||||
| +    ; GFX1150-NEXT: S_SETPRIO 3
 | ||||
| +    ; GFX1150-NEXT: S_ENDPGM 0
 | ||||
| +    S_SETPRIO 3
 | ||||
| +    EXP 1, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    EXP_DONE 0, $vgpr0, $vgpr0, $vgpr0, $vgpr0, -1, -1, 15, implicit $exec
 | ||||
| +    S_SETPRIO 3
 | ||||
| +    S_ENDPGM 0
 | ||||
| +...
 | ||||
| 
 | ||||
| From 8ea44e65f2c19facff751aeb2ac960f907fb210f Mon Sep 17 00:00:00 2001 | ||||
| From: Carl Ritson <carl.ritson@amd.com> | ||||
| Date: Wed, 17 Jul 2024 16:18:02 +0900 | ||||
| Subject: [PATCH 2/3] Remove -verify-machineinstrs from test. | ||||
| 
 | ||||
| ---
 | ||||
|  llvm/test/CodeGen/AMDGPU/required-export-priority.ll | 2 +- | ||||
|  1 file changed, 1 insertion(+), 1 deletion(-) | ||||
| 
 | ||||
| diff --git a/llvm/test/CodeGen/AMDGPU/required-export-priority.ll b/llvm/test/CodeGen/AMDGPU/required-export-priority.ll
 | ||||
| index 377902f3f0d1a..ebc209bd4d451 100644
 | ||||
| --- a/llvm/test/CodeGen/AMDGPU/required-export-priority.ll
 | ||||
| +++ b/llvm/test/CodeGen/AMDGPU/required-export-priority.ll
 | ||||
| @@ -1,5 +1,5 @@
 | ||||
|  ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 | ||||
| -; RUN: llc -mtriple=amdgcn -mcpu=gfx1150 -amdgpu-enable-vopd=0 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
 | ||||
| +; RUN: llc -mtriple=amdgcn -mcpu=gfx1150 -amdgpu-enable-vopd=0 < %s | FileCheck -check-prefix=GCN %s
 | ||||
|   | ||||
|  define amdgpu_ps void @test_export_zeroes_f32() #0 { | ||||
|  ; GCN-LABEL: test_export_zeroes_f32: | ||||
							
								
								
									
										190
									
								
								Makefile
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										190
									
								
								Makefile
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,190 @@ | ||||
| .DEFAULT_GOAL=help | ||||
| 
 | ||||
| # See ~/.config/mock/<CONFIG>.cfg or /etc/mock/<CONFIG>.cfg
 | ||||
| # Tweak this to centos-stream-9-x86_64 to build for CentOS
 | ||||
| MOCK_CHROOT?=centos-stream-10-x86_64 | ||||
| MOCK_OPTS?= | ||||
| MOCK_OPTS_RELEASE?=--no-clean --no-cleanup-after --without lto_build --define "debug_package %{nil}" $(MOCK_OPTS) | ||||
| MOCK_OPTS_SNAPSHOT?=$(MOCK_OPTS_RELEASE) --with snapshot_build $(MOCK_OPTS) | ||||
| YYYYMMDD?=$(shell date +%Y%m%d) | ||||
| SOURCEDIR=$(shell pwd) | ||||
| SPEC=llvm.spec | ||||
| # When nothing is given, this will be determined based on release or snapshot
 | ||||
| # builds.
 | ||||
| SRPM_PATH?= | ||||
| # Provide a path to your local llvm-project clone to build a snapshot of that
 | ||||
| # tree.
 | ||||
| GIT_TREE?= | ||||
| 
 | ||||
| ######### Get sources
 | ||||
| 
 | ||||
| .PHONY: get-sources-snapshot | ||||
| ## Downloads all sources we need for a snapshot build.
 | ||||
| get-sources-snapshot: | ||||
| 	YYYYMMDD=$(YYYYMMDD) GIT_TREE=$(GIT_TREE) ./.copr/snapshot-info.sh > $(SOURCEDIR)/version.spec.inc | ||||
| ifeq ($(GIT_TREE),) | ||||
| 	spectool -g --define "_sourcedir $(SOURCEDIR)" --define "_with_snapshot_build 1" $(SPEC) | ||||
| else | ||||
| 	$(info Creating tarball from git tree: $(GIT_TREE)) | ||||
| 	$(eval llvm_snapshot_git_revision:=$(shell git -C $(GIT_TREE) rev-parse HEAD)) | ||||
| 	git -C $(GIT_TREE) archive --format=tar.gz -o $(PWD)/$(llvm_snapshot_git_revision).tar.gz --prefix=llvm-project-$(llvm_snapshot_git_revision)/ HEAD | ||||
| endif | ||||
| 
 | ||||
| 
 | ||||
| .PHONY: get-sources-release | ||||
| ## Downloads all sources we need for a release build.
 | ||||
| get-sources-release: | ||||
| 	spectool -g --define "_sourcedir $(SOURCEDIR)" $(SPEC) | ||||
| 
 | ||||
| ######### Build SRPM
 | ||||
| 
 | ||||
| .PHONY: srpm-release | ||||
| ## Builds an SRPM that can be used for a release build.
 | ||||
| srpm-release: get-sources-release | ||||
| 	rpmbuild \
 | ||||
| 		--define "_rpmdir $(SOURCEDIR)" \
 | ||||
| 		--define "_sourcedir $(SOURCEDIR)" \
 | ||||
| 		--define "_specdir $(SOURCEDIR)" \
 | ||||
| 		--define "_srcrpmdir $(SOURCEDIR)" \
 | ||||
| 		--define "_builddir $(SOURCEDIR)" \
 | ||||
| 		-bs $(SPEC) | ||||
| 
 | ||||
| .PHONY: srpm-snapshot | ||||
| ## Builds an SRPM that can be used for a snapshot build.
 | ||||
| srpm-snapshot: get-sources-snapshot | ||||
| 	rpmbuild \
 | ||||
| 		--with=snapshot_build \
 | ||||
| 		--define "_rpmdir $(SOURCEDIR)" \
 | ||||
| 		--define "_sourcedir $(SOURCEDIR)" \
 | ||||
| 		--define "_specdir $(SOURCEDIR)" \
 | ||||
| 		--define "_srcrpmdir $(SOURCEDIR)" \
 | ||||
| 		--define "_builddir $(SOURCEDIR)" \
 | ||||
| 		-bs $(SPEC) | ||||
| 
 | ||||
| ######### Scrub mock chroot and cache
 | ||||
| 
 | ||||
| .PHONY: scrub-chroot | ||||
| ## Completely remove the fedora chroot and cache.
 | ||||
| scrub-chroot: | ||||
| 	mock -r $(MOCK_CHROOT) --scrub all | ||||
| 
 | ||||
| ######### Do a mock build
 | ||||
| 
 | ||||
| .PHONY: mockbuild-release | ||||
| ## Start a mock build of the release SRPM.
 | ||||
| mockbuild-release: srpm-release get-srpm-release | ||||
| 	mock -r $(MOCK_CHROOT) $(MOCK_OPTS_RELEASE) $(srpm_path) | ||||
| 
 | ||||
| .PHONY: mockbuild-snapshot | ||||
| ## Start a mock build of the snapshot SRPM.
 | ||||
| mockbuild-snapshot: srpm-snapshot get-srpm-snapshot | ||||
| 	mock -r $(MOCK_CHROOT) $(MOCK_OPTS_SNAPSHOT) $(srpm_path) | ||||
| 
 | ||||
| ######### Edit-last-failing-script
 | ||||
| 
 | ||||
| .PHONY: get-last-run-script | ||||
| ## Get the file that was last modified in /var/tmp/ within the chroot.
 | ||||
| get-last-run-script: | ||||
| 	$(eval last_run_script:=/var/tmp/$(shell ls -t1 /var/lib/mock/$(MOCK_CHROOT)/root/var/tmp | head -n1)) | ||||
| 	$(info last_run_script=$(last_run_script)) | ||||
| 	@echo > /dev/null | ||||
| 
 | ||||
| .PHONY: edit-last-failing-script | ||||
| ## Opens the last failing or running script from mock in your editor
 | ||||
| ## of choice for you to edit it and later re-run it in mock with:
 | ||||
| ## "make mockbuild-rerun-last-script".
 | ||||
| edit-last-failing-script: get-last-run-script | ||||
| 	$$EDITOR /var/lib/mock/$(MOCK_CHROOT)/root$(last_run_script) | ||||
| 
 | ||||
| ######### Re-run the last failing script from mock
 | ||||
| 
 | ||||
| .PHONY: mockbuild-rerun-last-script | ||||
| ## Re-runs the last failing or running script of your release/snapshot mock mockbuild.
 | ||||
| mockbuild-rerun-last-script: get-last-run-script | ||||
| 	mock --root=$(MOCK_CHROOT) --shell 'sh -e $(last_run_script)' | ||||
| 
 | ||||
| .PHONY: help | ||||
| # Based on https://gist.github.com/rcmachado/af3db315e31383502660
 | ||||
| ## Display this help text.
 | ||||
| help:/ | ||||
| 	$(info Available targets) | ||||
| 	$(info -----------------) | ||||
| 	@awk '/^[a-zA-Z\-0-9]+:/ { \
 | ||||
| 		helpMessage = match(lastLine, /^## (.*)/); \
 | ||||
| 		helpCommand = substr($$1, 0, index($$1, ":")-1); \
 | ||||
| 		if (helpMessage) { \
 | ||||
| 			helpMessage = substr(lastLine, RSTART + 3, RLENGTH); \
 | ||||
| 			gsub(/##/, "\n                                       ", helpMessage); \
 | ||||
| 		} else { \
 | ||||
| 			helpMessage = "(No documentation)"; \
 | ||||
| 		} \
 | ||||
| 		printf "%-37s - %s\n", helpCommand, helpMessage; \
 | ||||
| 		lastLine = "" \
 | ||||
| 	} \
 | ||||
| 	{ hasComment = match(lastLine, /^## (.*)/); \
 | ||||
|           if(hasComment) { \
 | ||||
|             lastLine=lastLine$$0; \
 | ||||
| 	  } \
 | ||||
|           else { \
 | ||||
| 	    lastLine = $$0 \
 | ||||
|           } \
 | ||||
|         }' $(MAKEFILE_LIST) | ||||
| 
 | ||||
| ######### Deprecated targets
 | ||||
| 
 | ||||
| # Map deprecated targets to new targets
 | ||||
| .PHONY: snapshot-srpm release-srpm | ||||
| snapshot-srpm release-srpm: | ||||
| 	$(eval mapped_target:=$(subst snapshot-srpm,srpm-snapshot,$(MAKECMDGOALS))) | ||||
| 	$(eval mapped_target:=$(subst release-srpm,srpm-release,$(mapped_target))) | ||||
| 	$(info WARNING: "$(MAKECMDGOALS)" is deprecated. Instead running "$(mapped_target)") | ||||
| 	$(MAKE) $(mapped_target) | ||||
| 
 | ||||
| ######### Version/Release helper targets to build name of SRPM
 | ||||
| 
 | ||||
| .PHONY: get-llvm-version-release | ||||
| ## Determines the LLVM version given in the llvm.spec file.
 | ||||
| get-llvm-version-release: | ||||
| 	$(eval llvm_version_release:=$(shell grep -ioP "%global\s+(maj|min|patch)_ver[^0-9]\K[0-9]+" $(SPEC) | paste -sd'.')) | ||||
| 	$(info LLVM Release Version: $(llvm_version_release)) | ||||
| 	@echo > /dev/null | ||||
| 
 | ||||
| .PHONY: get-llvm-version-snapshot | ||||
| ## Determines the LLVM version given in the version.spec.inc file.
 | ||||
| get-llvm-version-snapshot: | ||||
| 	$(eval llvm_version_snapshot:=$(shell grep -ioP "%global\s+(maj|min|patch)_ver[^0-9]\K[0-9]+" version.spec.inc | paste -sd'.')) | ||||
| 	$(info LLVM Snapshot Version: $(llvm_version_snapshot)) | ||||
| 	@echo > /dev/null | ||||
| 
 | ||||
| .PHONY: get-spec-file-release | ||||
| ## Parses the spec file for the Release: tag
 | ||||
| get-spec-file-release: | ||||
| 	$(eval spec_file_release:=$(shell grep -ioP '^Release:\s*\K[0-9]+' $(SPEC))) | ||||
| 	$(info LLVM Spec file Release: $(spec_file_release)) | ||||
| 	@echo > /dev/null | ||||
| 
 | ||||
| .PHONY: get-srpm-release | ||||
| ## Determines the name of the SRPM used for release builds
 | ||||
| ## Can be overriden by giving "make ... SRPM_PATH=foo.src.rpm".
 | ||||
| get-srpm-release: get-llvm-version-release get-spec-file-release | ||||
| ifeq ($(SRPM_PATH),) | ||||
| 	$(eval srpm_path:=llvm-$(llvm_version_release)-$(spec_file_release).*.src.rpm) | ||||
| else | ||||
| 	$(eval srpm_path:=$(SRPM_PATH)) | ||||
| endif | ||||
| 	$(info LLVM SRPM Release: $(srpm_path)) | ||||
| 	@echo > /dev/null | ||||
| 
 | ||||
| .PHONY: get-srpm-snapshot | ||||
| ## Determines the name of the SRPM used for snapshot builds
 | ||||
| ## Can be overriden by giving "make ... SRPM_PATH=foo.src.rpm".
 | ||||
| get-srpm-snapshot: get-llvm-version-snapshot get-spec-file-release | ||||
| ifeq ($(SRPM_PATH),) | ||||
| 	$(eval yyyymmdd:=$(shell grep -ioP "%global\s+llvm_snapshot_yyyymmdd\s+\K[0-9]+" version.spec.inc)) | ||||
| 	$(eval git_short:=$(shell grep -ioP "%global\s+llvm_snapshot_git_revision_short\s+\K[a-zA-Z0-9]+" version.spec.inc)) | ||||
| 	$(eval srpm_path:=llvm-$(llvm_version_snapshot)~pre$(yyyymmdd).g$(git_short)-$(spec_file_release).*.src.rpm) | ||||
| else | ||||
| 	$(eval srpm_path:=$(SRPM_PATH)) | ||||
| endif | ||||
| 	$(info LLVM SRPM Snapshot: $(srpm_path)) | ||||
| 	@echo > /dev/null | ||||
| @ -1,3 +1,5 @@ | ||||
| ## LLVM ############################################################# | ||||
| 
 | ||||
| # This library has no dependencies. | ||||
| addFilter("llvm-libs.x86_64: E: shared-lib-without-dependency-information /usr/lib64/libRemarks.so.[0-9]+") | ||||
| addFilter("llvm-googletest.x86_64: W: devel-file-in-non-devel-package") | ||||
| @ -16,3 +18,32 @@ addFilter("llvm-googletest.x86_64: W: no-documentation") | ||||
| addFilter("llvm-libs.x86_64: W: no-documentation") | ||||
| addFilter("llvm-static.x86_64: W: no-documentation") | ||||
| addFilter("llvm-test.x86_64: W: no-documentation") | ||||
| 
 | ||||
| ## COMPILER-RT ###################################################### | ||||
| 
 | ||||
| # This is a devel package | ||||
| addFilter("W: devel-file-in-non-devel-package") | ||||
| 
 | ||||
| # These symlinks are dangling on x64_64 | ||||
| addFilter("compiler-rt.x86_64: W: dangling-relative-symlink /usr/lib64/clang/[0-9]+.[0-9]+.[0-9]+/") | ||||
| 
 | ||||
| addFilter("E: hardcoded-library-path in ../../lib/clang/") | ||||
| 
 | ||||
| 
 | ||||
| ## LIBOMP ########################################################### | ||||
| 
 | ||||
| 
 | ||||
| 
 | ||||
| ## CLANG ############################################################ | ||||
| 
 | ||||
| clang needs libstdc++-devel installed in order to compile c++ programs. | ||||
| 
 | ||||
| addFilter("E: devel-dependency libstdc\+\+-devel") | ||||
| 
 | ||||
| addFilter("E: explicit-lib-dependency libstdc\+\+-devel") | ||||
| 
 | ||||
| # clang installs libear to /usr/lib on all arches, so we have to use | ||||
| 
 | ||||
| # a hard-coded /usr/lib path in order to move it to the python3 sitelib. | ||||
| 
 | ||||
| addFilter("E: hardcoded-library-path in %{_prefix}/lib/{libear") | ||||
|  | ||||
| @ -18,3 +18,7 @@ badfuncs: | ||||
|             - gethostbyname2 | ||||
|             - inet_aton | ||||
| 
 | ||||
| unicode: | ||||
|     ignore: | ||||
|         # Ignore bidirectional unicode sequence documentation file | ||||
|         - llvm-project-*.src/clang-tools-extra/docs/clang-tidy/checks/misc/misleading-bidirectional.rst | ||||
|  | ||||
							
								
								
									
										2
									
								
								sources
									
									
									
									
									
								
							
							
						
						
									
										2
									
								
								sources
									
									
									
									
									
								
							| @ -1,2 +1,4 @@ | ||||
| SHA512 (llvm-project-20.1.2.src.tar.xz) = c95e088e471d49c6692c8af1a7e40924467e4c269dada019c44455687c9f0e6a213b9b3ac8afa4e3d20cb3e757afc3400152e7cd06981aeebd61591cac15580d | ||||
| SHA512 (llvm-project-20.1.2.src.tar.xz.sig) = d3f6a350ebd9884878442ea202f58328f8e85c30cfb150371e4af7fa8dc560bb421cd0f49f49e6bc95f57de6c06543633f0b2799aab9590750f440e099424e01 | ||||
| SHA512 (llvm-project-19.1.7.src.tar.xz) = c7d63286d662707a9cd54758c9e3aaf52794a91900c484c4a6efa62d90bc719d5e7a345e4192feeb0c9fd11c82570d64677c781e5be1d645556b6aa018e47ec8 | ||||
| SHA512 (llvm-project-19.1.7.src.tar.xz.sig) = 195797b06ac80a742e0ccbc03a50dc06dd2e04377d783d5474e3e72c5a75203b60292b047929312a411d22b137a239943fba414a4d136a2be14cbff978eb6bda | ||||
|  | ||||
| @ -1,13 +1,14 @@ | ||||
| # | ||||
| # Build/PR gating tests for *LLVM 13* | ||||
| # Build/PR gating tests for *LLVM 19* | ||||
| # | ||||
| # Compatible with various LLVM 13 distributions: | ||||
| # Compatible with various LLVM 19 distributions: | ||||
| # | ||||
| #   * Fedora (ursine packages) | ||||
| #   * CentOS 10 stream (ursine packages) | ||||
| #   * Centos 9 stream (ursine packages) | ||||
| #   * RHEL-10 (ursine packages) | ||||
| #   * RHEL-9 (ursine packages) | ||||
| #   * RHEL-8 (Red Hat module) | ||||
| #   * RHEL-7 (software collection) | ||||
| # | ||||
| 
 | ||||
| summary: LLVM tests for build/PR gating | ||||
|  | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user