r342078 - [Hexagon] Remove fp-contract=fast setting at O3
Author: bcahoon Date: Wed Sep 12 13:35:56 2018 New Revision: 342078 URL: http://llvm.org/viewvc/llvm-project?rev=342078&view=rev Log: [Hexagon] Remove fp-contract=fast setting at O3 Change Hexagon so that the setting for fp-contract is the default setting. This makes Hexagon consistent with all other targets. Differential Revision: https://reviews.llvm.org/D4 Modified: cfe/trunk/lib/Driver/ToolChains/Hexagon.cpp cfe/trunk/test/Driver/hexagon-toolchain-elf.c Modified: cfe/trunk/lib/Driver/ToolChains/Hexagon.cpp URL: http://llvm.org/viewvc/llvm-project/cfe/trunk/lib/Driver/ToolChains/Hexagon.cpp?rev=342078&r1=342077&r2=342078&view=diff == --- cfe/trunk/lib/Driver/ToolChains/Hexagon.cpp (original) +++ cfe/trunk/lib/Driver/ToolChains/Hexagon.cpp Wed Sep 12 13:35:56 2018 @@ -513,11 +513,6 @@ unsigned HexagonToolChain::getOptimizati void HexagonToolChain::addClangTargetOptions(const ArgList &DriverArgs, ArgStringList &CC1Args, Action::OffloadKind) const { - if (!DriverArgs.hasArg(options::OPT_ffp_contract)) { -unsigned OptLevel = getOptimizationLevel(DriverArgs); -if (OptLevel >= 3) - CC1Args.push_back("-ffp-contract=fast"); - } if (DriverArgs.hasArg(options::OPT_ffixed_r19)) { CC1Args.push_back("-target-feature"); CC1Args.push_back("+reserved-r19"); Modified: cfe/trunk/test/Driver/hexagon-toolchain-elf.c URL: http://llvm.org/viewvc/llvm-project/cfe/trunk/test/Driver/hexagon-toolchain-elf.c?rev=342078&r1=342077&r2=342078&view=diff == --- cfe/trunk/test/Driver/hexagon-toolchain-elf.c (original) +++ cfe/trunk/test/Driver/hexagon-toolchain-elf.c Wed Sep 12 13:35:56 2018 @@ -110,7 +110,7 @@ // RUN: -O3 \ // RUN: %s 2>&1 \ // RUN: | FileCheck -check-prefix=CHECK026 %s -// CHECK026: "-ffp-contract=fast" +// CHECK026-NOT: "-ffp-contract=fast" // CHECK026: hexagon-link // RUN: %clang -### -target hexagon-unknown-elf \ ___ cfe-commits mailing list cfe-commits@lists.llvm.org http://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits
[clang] ea10a86 - [AMDGPU] Add gfx1013 target
Author: Brendon Cahoon Date: 2021-06-08T12:49:49-04:00 New Revision: ea10a86984ea73fcec3b12d22404a15f2f59b219 URL: https://github.com/llvm/llvm-project/commit/ea10a86984ea73fcec3b12d22404a15f2f59b219 DIFF: https://github.com/llvm/llvm-project/commit/ea10a86984ea73fcec3b12d22404a15f2f59b219.diff LOG: [AMDGPU] Add gfx1013 target Differential Revision: https://reviews.llvm.org/D103663 Added: Modified: clang/include/clang/Basic/Cuda.h clang/lib/Basic/Cuda.cpp clang/lib/Basic/Targets/AMDGPU.cpp clang/lib/Basic/Targets/NVPTX.cpp clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp clang/test/CodeGenOpenCL/amdgpu-features.cl clang/test/Driver/amdgpu-macros.cl clang/test/Driver/amdgpu-mcpu.cl clang/test/Misc/target-invalid-cpu-note.c llvm/docs/AMDGPUUsage.rst llvm/include/llvm/BinaryFormat/ELF.h llvm/include/llvm/Support/TargetParser.h llvm/lib/Object/ELFObjectFile.cpp llvm/lib/ObjectYAML/ELFYAML.cpp llvm/lib/Support/TargetParser.cpp llvm/lib/Target/AMDGPU/AMDGPU.td llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp llvm/lib/Target/AMDGPU/AMDGPUSubtarget.cpp llvm/lib/Target/AMDGPU/GCNProcessors.td llvm/lib/Target/AMDGPU/GCNSubtarget.h llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUTargetStreamer.cpp llvm/lib/Target/AMDGPU/MIMGInstructions.td llvm/lib/Target/AMDGPU/SIISelLowering.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h llvm/test/CodeGen/AMDGPU/GlobalISel/llvm.amdgcn.intersect_ray.ll llvm/test/CodeGen/AMDGPU/directive-amdgcn-target.ll llvm/test/CodeGen/AMDGPU/elf-header-flags-mach.ll llvm/test/CodeGen/AMDGPU/llvm.amdgcn.intersect_ray.ll llvm/test/MC/AMDGPU/dl-insts-err.s llvm/test/MC/AMDGPU/gfx10_unsupported.s llvm/test/Object/AMDGPU/elf-header-flags-mach.yaml llvm/test/tools/llvm-objdump/ELF/AMDGPU/subtarget.ll llvm/test/tools/llvm-readobj/ELF/amdgpu-elf-headers.test llvm/tools/llvm-readobj/ELFDumper.cpp openmp/libomptarget/plugins/amdgpu/impl/get_elf_mach_gfx_name.cpp Removed: diff --git a/clang/include/clang/Basic/Cuda.h 
b/clang/include/clang/Basic/Cuda.h index e580fea9c5102..13317f62c3c5a 100644 --- a/clang/include/clang/Basic/Cuda.h +++ b/clang/include/clang/Basic/Cuda.h @@ -83,6 +83,7 @@ enum class CudaArch { GFX1010, GFX1011, GFX1012, + GFX1013, GFX1030, GFX1031, GFX1032, diff --git a/clang/lib/Basic/Cuda.cpp b/clang/lib/Basic/Cuda.cpp index 79cc6c9d7489d..fa7f78a25829f 100644 --- a/clang/lib/Basic/Cuda.cpp +++ b/clang/lib/Basic/Cuda.cpp @@ -105,6 +105,7 @@ static const CudaArchToStringMap arch_names[] = { GFX(1010), // gfx1010 GFX(1011), // gfx1011 GFX(1012), // gfx1012 +GFX(1013), // gfx1013 GFX(1030), // gfx1030 GFX(1031), // gfx1031 GFX(1032), // gfx1032 diff --git a/clang/lib/Basic/Targets/AMDGPU.cpp b/clang/lib/Basic/Targets/AMDGPU.cpp index 12cab8bd456b3..8a8165e9c895c 100644 --- a/clang/lib/Basic/Targets/AMDGPU.cpp +++ b/clang/lib/Basic/Targets/AMDGPU.cpp @@ -214,6 +214,7 @@ bool AMDGPUTargetInfo::initFeatureMap( Features["dot6-insts"] = true; Features["dot7-insts"] = true; LLVM_FALLTHROUGH; +case GK_GFX1013: case GK_GFX1010: Features["dl-insts"] = true; Features["ci-insts"] = true; diff --git a/clang/lib/Basic/Targets/NVPTX.cpp b/clang/lib/Basic/Targets/NVPTX.cpp index 70ddff4c7cf35..885dac9ab79d7 100644 --- a/clang/lib/Basic/Targets/NVPTX.cpp +++ b/clang/lib/Basic/Targets/NVPTX.cpp @@ -207,6 +207,7 @@ void NVPTXTargetInfo::getTargetDefines(const LangOptions &Opts, case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp index 2ceb3a4cd5ab6..e0f9f5449b64b 100644 --- a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp +++ b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp @@ -4482,6 +4482,7 @@ void CGOpenMPRuntimeGPU::processRequiresDirective( case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case 
CudaArch::GFX1031: case CudaArch::GFX1032: @@ -4553,6 +4554,7 @@ static std::pair getSMsBlocksPerSM(CodeGenModule &CGM) { case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/test/CodeGenOpenCL/amdgpu-features.cl b/clang/test/CodeGenOpenCL/amdgpu-features.cl index 35c1ab3c1a6d8..b4b86d75c9ae7 100644 --- a/clang/test/CodeGenOpenCL/amdgpu-features.cl +++ b/clang/test/CodeGenOpenCL/amdgpu-features.cl @@ -28,6 +28,
[clang] 211e584 - Revert "[AMDGPU] Add gfx1013 target"
Author: Brendon Cahoon Date: 2021-06-08T16:29:41-04:00 New Revision: 211e584fa2a4c032e4d573e7cdbffd622aad0a8f URL: https://github.com/llvm/llvm-project/commit/211e584fa2a4c032e4d573e7cdbffd622aad0a8f DIFF: https://github.com/llvm/llvm-project/commit/211e584fa2a4c032e4d573e7cdbffd622aad0a8f.diff LOG: Revert "[AMDGPU] Add gfx1013 target" This reverts commit ea10a86984ea73fcec3b12d22404a15f2f59b219. A sanitizer buildbot reports an error. Added: Modified: clang/include/clang/Basic/Cuda.h clang/lib/Basic/Cuda.cpp clang/lib/Basic/Targets/AMDGPU.cpp clang/lib/Basic/Targets/NVPTX.cpp clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp clang/test/CodeGenOpenCL/amdgpu-features.cl clang/test/Driver/amdgpu-macros.cl clang/test/Driver/amdgpu-mcpu.cl clang/test/Misc/target-invalid-cpu-note.c llvm/docs/AMDGPUUsage.rst llvm/include/llvm/BinaryFormat/ELF.h llvm/include/llvm/Support/TargetParser.h llvm/lib/Object/ELFObjectFile.cpp llvm/lib/ObjectYAML/ELFYAML.cpp llvm/lib/Support/TargetParser.cpp llvm/lib/Target/AMDGPU/AMDGPU.td llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp llvm/lib/Target/AMDGPU/AMDGPUSubtarget.cpp llvm/lib/Target/AMDGPU/GCNProcessors.td llvm/lib/Target/AMDGPU/GCNSubtarget.h llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUTargetStreamer.cpp llvm/lib/Target/AMDGPU/MIMGInstructions.td llvm/lib/Target/AMDGPU/SIISelLowering.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h llvm/test/CodeGen/AMDGPU/GlobalISel/llvm.amdgcn.intersect_ray.ll llvm/test/CodeGen/AMDGPU/directive-amdgcn-target.ll llvm/test/CodeGen/AMDGPU/elf-header-flags-mach.ll llvm/test/CodeGen/AMDGPU/llvm.amdgcn.intersect_ray.ll llvm/test/MC/AMDGPU/dl-insts-err.s llvm/test/MC/AMDGPU/gfx10_unsupported.s llvm/test/Object/AMDGPU/elf-header-flags-mach.yaml llvm/test/tools/llvm-objdump/ELF/AMDGPU/subtarget.ll llvm/test/tools/llvm-readobj/ELF/amdgpu-elf-headers.test llvm/tools/llvm-readobj/ELFDumper.cpp openmp/libomptarget/plugins/amdgpu/impl/get_elf_mach_gfx_name.cpp Removed: diff 
--git a/clang/include/clang/Basic/Cuda.h b/clang/include/clang/Basic/Cuda.h index 13317f62c3c5a..e580fea9c5102 100644 --- a/clang/include/clang/Basic/Cuda.h +++ b/clang/include/clang/Basic/Cuda.h @@ -83,7 +83,6 @@ enum class CudaArch { GFX1010, GFX1011, GFX1012, - GFX1013, GFX1030, GFX1031, GFX1032, diff --git a/clang/lib/Basic/Cuda.cpp b/clang/lib/Basic/Cuda.cpp index fa7f78a25829f..79cc6c9d7489d 100644 --- a/clang/lib/Basic/Cuda.cpp +++ b/clang/lib/Basic/Cuda.cpp @@ -105,7 +105,6 @@ static const CudaArchToStringMap arch_names[] = { GFX(1010), // gfx1010 GFX(1011), // gfx1011 GFX(1012), // gfx1012 -GFX(1013), // gfx1013 GFX(1030), // gfx1030 GFX(1031), // gfx1031 GFX(1032), // gfx1032 diff --git a/clang/lib/Basic/Targets/AMDGPU.cpp b/clang/lib/Basic/Targets/AMDGPU.cpp index 8a8165e9c895c..12cab8bd456b3 100644 --- a/clang/lib/Basic/Targets/AMDGPU.cpp +++ b/clang/lib/Basic/Targets/AMDGPU.cpp @@ -214,7 +214,6 @@ bool AMDGPUTargetInfo::initFeatureMap( Features["dot6-insts"] = true; Features["dot7-insts"] = true; LLVM_FALLTHROUGH; -case GK_GFX1013: case GK_GFX1010: Features["dl-insts"] = true; Features["ci-insts"] = true; diff --git a/clang/lib/Basic/Targets/NVPTX.cpp b/clang/lib/Basic/Targets/NVPTX.cpp index 885dac9ab79d7..70ddff4c7cf35 100644 --- a/clang/lib/Basic/Targets/NVPTX.cpp +++ b/clang/lib/Basic/Targets/NVPTX.cpp @@ -207,7 +207,6 @@ void NVPTXTargetInfo::getTargetDefines(const LangOptions &Opts, case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: - case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp index e0f9f5449b64b..2ceb3a4cd5ab6 100644 --- a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp +++ b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp @@ -4482,7 +4482,6 @@ void CGOpenMPRuntimeGPU::processRequiresDirective( case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: - case CudaArch::GFX1013: 
case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: @@ -4554,7 +4553,6 @@ static std::pair getSMsBlocksPerSM(CodeGenModule &CGM) { case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: - case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/test/CodeGenOpenCL/amdgpu-features.cl b/clang/test/CodeGenOpenCL/amdgpu-features.cl index b4b86d75c9ae7..35c1ab3c1a6d8 100644 --- a/clang/test/CodeGenOpenCL/amdgpu-features.cl +++ b/cl
[clang] 294efbb - Reland "[AMDGPU] Add gfx1013 target"
Author: Brendon Cahoon Date: 2021-06-08T21:15:35-04:00 New Revision: 294efbbd3e3d55671ef8b220c231a2807c38eefe URL: https://github.com/llvm/llvm-project/commit/294efbbd3e3d55671ef8b220c231a2807c38eefe DIFF: https://github.com/llvm/llvm-project/commit/294efbbd3e3d55671ef8b220c231a2807c38eefe.diff LOG: Reland "[AMDGPU] Add gfx1013 target" This reverts commit 211e584fa2a4c032e4d573e7cdbffd622aad0a8f. Fixed a use-after-free error that caused the sanitizers to fail. Added: Modified: clang/include/clang/Basic/Cuda.h clang/lib/Basic/Cuda.cpp clang/lib/Basic/Targets/AMDGPU.cpp clang/lib/Basic/Targets/NVPTX.cpp clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp clang/test/CodeGenOpenCL/amdgpu-features.cl clang/test/Driver/amdgpu-macros.cl clang/test/Driver/amdgpu-mcpu.cl clang/test/Misc/target-invalid-cpu-note.c llvm/docs/AMDGPUUsage.rst llvm/include/llvm/BinaryFormat/ELF.h llvm/include/llvm/Support/TargetParser.h llvm/lib/Object/ELFObjectFile.cpp llvm/lib/ObjectYAML/ELFYAML.cpp llvm/lib/Support/TargetParser.cpp llvm/lib/Target/AMDGPU/AMDGPU.td llvm/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp llvm/lib/Target/AMDGPU/AMDGPUSubtarget.cpp llvm/lib/Target/AMDGPU/GCNProcessors.td llvm/lib/Target/AMDGPU/GCNSubtarget.h llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUTargetStreamer.cpp llvm/lib/Target/AMDGPU/MIMGInstructions.td llvm/lib/Target/AMDGPU/SIISelLowering.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h llvm/test/CodeGen/AMDGPU/GlobalISel/llvm.amdgcn.intersect_ray.ll llvm/test/CodeGen/AMDGPU/directive-amdgcn-target.ll llvm/test/CodeGen/AMDGPU/elf-header-flags-mach.ll llvm/test/CodeGen/AMDGPU/llvm.amdgcn.intersect_ray.ll llvm/test/MC/AMDGPU/dl-insts-err.s llvm/test/MC/AMDGPU/gfx10_unsupported.s llvm/test/Object/AMDGPU/elf-header-flags-mach.yaml llvm/test/tools/llvm-objdump/ELF/AMDGPU/subtarget.ll llvm/test/tools/llvm-readobj/ELF/amdgpu-elf-headers.test llvm/tools/llvm-readobj/ELFDumper.cpp 
openmp/libomptarget/plugins/amdgpu/impl/get_elf_mach_gfx_name.cpp Removed: diff --git a/clang/include/clang/Basic/Cuda.h b/clang/include/clang/Basic/Cuda.h index e580fea9c5102..13317f62c3c5a 100644 --- a/clang/include/clang/Basic/Cuda.h +++ b/clang/include/clang/Basic/Cuda.h @@ -83,6 +83,7 @@ enum class CudaArch { GFX1010, GFX1011, GFX1012, + GFX1013, GFX1030, GFX1031, GFX1032, diff --git a/clang/lib/Basic/Cuda.cpp b/clang/lib/Basic/Cuda.cpp index 79cc6c9d7489d..fa7f78a25829f 100644 --- a/clang/lib/Basic/Cuda.cpp +++ b/clang/lib/Basic/Cuda.cpp @@ -105,6 +105,7 @@ static const CudaArchToStringMap arch_names[] = { GFX(1010), // gfx1010 GFX(1011), // gfx1011 GFX(1012), // gfx1012 +GFX(1013), // gfx1013 GFX(1030), // gfx1030 GFX(1031), // gfx1031 GFX(1032), // gfx1032 diff --git a/clang/lib/Basic/Targets/AMDGPU.cpp b/clang/lib/Basic/Targets/AMDGPU.cpp index 12cab8bd456b3..8a8165e9c895c 100644 --- a/clang/lib/Basic/Targets/AMDGPU.cpp +++ b/clang/lib/Basic/Targets/AMDGPU.cpp @@ -214,6 +214,7 @@ bool AMDGPUTargetInfo::initFeatureMap( Features["dot6-insts"] = true; Features["dot7-insts"] = true; LLVM_FALLTHROUGH; +case GK_GFX1013: case GK_GFX1010: Features["dl-insts"] = true; Features["ci-insts"] = true; diff --git a/clang/lib/Basic/Targets/NVPTX.cpp b/clang/lib/Basic/Targets/NVPTX.cpp index 70ddff4c7cf35..885dac9ab79d7 100644 --- a/clang/lib/Basic/Targets/NVPTX.cpp +++ b/clang/lib/Basic/Targets/NVPTX.cpp @@ -207,6 +207,7 @@ void NVPTXTargetInfo::getTargetDefines(const LangOptions &Opts, case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp index 2ceb3a4cd5ab6..e0f9f5449b64b 100644 --- a/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp +++ b/clang/lib/CodeGen/CGOpenMPRuntimeGPU.cpp @@ -4482,6 +4482,7 @@ void CGOpenMPRuntimeGPU::processRequiresDirective( case 
CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: @@ -4553,6 +4554,7 @@ static std::pair getSMsBlocksPerSM(CodeGenModule &CGM) { case CudaArch::GFX1010: case CudaArch::GFX1011: case CudaArch::GFX1012: + case CudaArch::GFX1013: case CudaArch::GFX1030: case CudaArch::GFX1031: case CudaArch::GFX1032: diff --git a/clang/test/CodeGenOpenCL/amdgpu-features.cl b/clang/test/CodeGenOpenCL/amdgpu-features.cl index 35c1ab3c1a6d8..b4b86d75c9ae7 100644 --- a/clang/test/CodeGenOpenCL/a