https://github.com/inbelic updated https://github.com/llvm/llvm-project/pull/122981
>From 98deff6a407b912852e70b2bdc3618aaec8a1931 Mon Sep 17 00:00:00 2001 From: Finn Plummer <canadienf...@gmail.com> Date: Fri, 24 Jan 2025 22:23:39 +0000 Subject: [PATCH 1/5] [HLSL][RootSignature] Initial Lexer Definition with puncuators - Defines the RootSignatureLexer class - Defines the test harness required for testing - Implements the punctuator tokens and tests functionality --- .../include/clang/Basic/DiagnosticLexKinds.td | 6 + .../Parse/HLSLRootSignatureTokenKinds.def | 35 ++++ .../clang/Parse/ParseHLSLRootSignature.h | 79 +++++++++ clang/lib/Parse/CMakeLists.txt | 1 + clang/lib/Parse/ParseHLSLRootSignature.cpp | 50 ++++++ clang/unittests/CMakeLists.txt | 1 + clang/unittests/Parse/CMakeLists.txt | 26 +++ .../Parse/ParseHLSLRootSignatureTest.cpp | 167 ++++++++++++++++++ 8 files changed, 365 insertions(+) create mode 100644 clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def create mode 100644 clang/include/clang/Parse/ParseHLSLRootSignature.h create mode 100644 clang/lib/Parse/ParseHLSLRootSignature.cpp create mode 100644 clang/unittests/Parse/CMakeLists.txt create mode 100644 clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp diff --git a/clang/include/clang/Basic/DiagnosticLexKinds.td b/clang/include/clang/Basic/DiagnosticLexKinds.td index 959376b0847216..7755c05bc8969b 100644 --- a/clang/include/clang/Basic/DiagnosticLexKinds.td +++ b/clang/include/clang/Basic/DiagnosticLexKinds.td @@ -1017,4 +1017,10 @@ Error<"'#pragma unsafe_buffer_usage' was not ended">; def err_pp_pragma_unsafe_buffer_usage_syntax : Error<"expected 'begin' or 'end'">; + +// HLSL Root Signature Lexing Errors +let CategoryName = "Root Signature Lexical Issue" in { + def err_hlsl_invalid_token: Error<"unable to lex a valid Root Signature token">; +} + } diff --git a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def new file mode 100644 index 00000000000000..9625f6a5bd76d9 --- /dev/null +++ b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def @@ -0,0 +1,35 @@ +//===--- HLSLRootSignature.def - Tokens and Enum Database -------*- C++ -*-===// + +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// +// +// This file defines the TokenKinds used in the Root Signature DSL. This +// includes keywords, enums and a small subset of punctuators. Users of this +// file must optionally #define the TOK, KEYWORD, ENUM or specific ENUM macros +// to make use of this file. +// +//===----------------------------------------------------------------------===// + +#ifndef TOK +#define TOK(X) +#endif +#ifndef PUNCTUATOR +#define PUNCTUATOR(X,Y) TOK(pu_ ## X) +#endif + +// General Tokens: +TOK(invalid) + +// Punctuators: +PUNCTUATOR(l_paren, '(') +PUNCTUATOR(r_paren, ')') +PUNCTUATOR(comma, ',') +PUNCTUATOR(or, '|') +PUNCTUATOR(equal, '=') + +#undef PUNCTUATOR +#undef TOK diff --git a/clang/include/clang/Parse/ParseHLSLRootSignature.h b/clang/include/clang/Parse/ParseHLSLRootSignature.h new file mode 100644 index 00000000000000..39069e7cc39988 --- /dev/null +++ b/clang/include/clang/Parse/ParseHLSLRootSignature.h @@ -0,0 +1,79 @@ +//===--- ParseHLSLRootSignature.h -------------------------------*- C++ -*-===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// +// +// This file defines the ParseHLSLRootSignature interface. +// +//===----------------------------------------------------------------------===// + +#ifndef LLVM_CLANG_PARSE_PARSEHLSLROOTSIGNATURE_H +#define LLVM_CLANG_PARSE_PARSEHLSLROOTSIGNATURE_H + +#include "clang/Basic/DiagnosticLex.h" +#include "clang/Lex/Preprocessor.h" + +#include "llvm/ADT/SmallVector.h" +#include "llvm/ADT/StringRef.h" + +namespace clang { +namespace hlsl { + +struct RootSignatureToken { + enum Kind { +#define TOK(X) X, +#include "clang/Parse/HLSLRootSignatureTokenKinds.def" + }; + + Kind Kind = Kind::invalid; + + // Retain the SouceLocation of the token for diagnostics + clang::SourceLocation TokLoc; + + // Constructors + RootSignatureToken(clang::SourceLocation TokLoc) : TokLoc(TokLoc) {} +}; +using TokenKind = enum RootSignatureToken::Kind; + +class RootSignatureLexer { +public: + RootSignatureLexer(StringRef Signature, clang::SourceLocation SourceLoc, + clang::Preprocessor &PP) + : Buffer(Signature), SourceLoc(SourceLoc), PP(PP) {} + + // Consumes the internal buffer as a list of tokens and will emplace them + // onto the given tokens. + // + // It will consume until it successfully reaches the end of the buffer, + // or, until the first error is encountered. The return value denotes if + // there was a failure. + bool Lex(SmallVector<RootSignatureToken> &Tokens); + +private: + // Internal buffer to iterate over + StringRef Buffer; + + // Passed down parameters from Sema + clang::SourceLocation SourceLoc; + clang::Preprocessor &PP; + + // Consumes the internal buffer for a single token. + // + // The return value denotes if there was a failure. + bool LexToken(RootSignatureToken &Token); + + // Advance the buffer by the specified number of characters. Updates the + // SourceLocation appropriately. + void AdvanceBuffer(unsigned NumCharacters = 1) { + Buffer = Buffer.drop_front(NumCharacters); + SourceLoc = SourceLoc.getLocWithOffset(NumCharacters); + } +}; + +} // namespace hlsl +} // namespace clang + +#endif // LLVM_CLANG_PARSE_PARSEHLSLROOTSIGNATURE_H diff --git a/clang/lib/Parse/CMakeLists.txt b/clang/lib/Parse/CMakeLists.txt index 22e902f7e1bc50..00fde537bb9c60 100644 --- a/clang/lib/Parse/CMakeLists.txt +++ b/clang/lib/Parse/CMakeLists.txt @@ -14,6 +14,7 @@ add_clang_library(clangParse ParseExpr.cpp ParseExprCXX.cpp ParseHLSL.cpp + ParseHLSLRootSignature.cpp ParseInit.cpp ParseObjc.cpp ParseOpenMP.cpp diff --git a/clang/lib/Parse/ParseHLSLRootSignature.cpp b/clang/lib/Parse/ParseHLSLRootSignature.cpp new file mode 100644 index 00000000000000..a9a9d209085c91 --- /dev/null +++ b/clang/lib/Parse/ParseHLSLRootSignature.cpp @@ -0,0 +1,50 @@ +#include "clang/Parse/ParseHLSLRootSignature.h" + +namespace clang { +namespace hlsl { + +// Lexer Definitions + +bool RootSignatureLexer::Lex(SmallVector<RootSignatureToken> &Tokens) { + // Discard any leading whitespace + AdvanceBuffer(Buffer.take_while(isspace).size()); + + while (!Buffer.empty()) { + // Record where this token is in the text for usage in parser diagnostics + RootSignatureToken Result(SourceLoc); + if (LexToken(Result)) + return true; + + // Successfully Lexed the token so we can store it + Tokens.push_back(Result); + + // Discard any trailing whitespace + AdvanceBuffer(Buffer.take_while(isspace).size()); + } + + return false; +} + +bool RootSignatureLexer::LexToken(RootSignatureToken &Result) { + char C = Buffer.front(); + + // Punctuators + switch (C) { +#define PUNCTUATOR(X, Y) \ + case Y: { \ + Result.Kind = TokenKind::pu_##X; \ + AdvanceBuffer(); \ + return false; \ + } +#include "clang/Parse/HLSLRootSignatureTokenKinds.def" + default: + break; + } + + // Unable to match on any token type + PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); + return true; +} + +} // namespace hlsl +} // namespace clang diff --git a/clang/unittests/CMakeLists.txt b/clang/unittests/CMakeLists.txt index 85d265426ec80b..9b3ce8aa7de739 100644 --- a/clang/unittests/CMakeLists.txt +++ b/clang/unittests/CMakeLists.txt @@ -25,6 +25,7 @@ endfunction() add_subdirectory(Basic) add_subdirectory(Lex) +add_subdirectory(Parse) add_subdirectory(Driver) if(CLANG_ENABLE_STATIC_ANALYZER) add_subdirectory(Analysis) diff --git a/clang/unittests/Parse/CMakeLists.txt b/clang/unittests/Parse/CMakeLists.txt new file mode 100644 index 00000000000000..1b7eb4934a46c8 --- /dev/null +++ b/clang/unittests/Parse/CMakeLists.txt @@ -0,0 +1,26 @@ +set(LLVM_LINK_COMPONENTS + Support + ) + +add_clang_unittest(ParseTests + ParseHLSLRootSignatureTest.cpp + ) + +clang_target_link_libraries(ParseTests + PRIVATE + clangAST + clangASTMatchers + clangBasic + clangFrontend + clangParse + clangSema + clangSerialization + clangTooling + ) + +target_link_libraries(ParseTests + PRIVATE + LLVMTestingAnnotations + LLVMTestingSupport + clangTesting + ) diff --git a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp new file mode 100644 index 00000000000000..e5f88bbfa0ff6a --- /dev/null +++ b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp @@ -0,0 +1,167 @@ +//=== ParseHLSLRootSignatureTest.cpp - Parse Root Signature tests ---------===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#include "clang/Basic/Diagnostic.h" +#include "clang/Basic/DiagnosticOptions.h" +#include "clang/Basic/FileManager.h" +#include "clang/Basic/LangOptions.h" +#include "clang/Basic/SourceLocation.h" +#include "clang/Basic/SourceManager.h" +#include "clang/Basic/TargetInfo.h" +#include "clang/Lex/HeaderSearch.h" +#include "clang/Lex/HeaderSearchOptions.h" +#include "clang/Lex/Lexer.h" +#include "clang/Lex/ModuleLoader.h" +#include "clang/Lex/Preprocessor.h" +#include "clang/Lex/PreprocessorOptions.h" + +#include "clang/Parse/ParseHLSLRootSignature.h" +#include "gtest/gtest.h" + +using namespace clang; + +namespace { + +// Diagnostic helper for helper tests +class ExpectedDiagConsumer : public DiagnosticConsumer { + virtual void anchor() {} + + void HandleDiagnostic(DiagnosticsEngine::Level DiagLevel, + const Diagnostic &Info) override { + if (!FirstDiag || !ExpectedDiagID.has_value()) { + Satisfied = false; + return; + } + FirstDiag = false; + + Satisfied = ExpectedDiagID.value() == Info.getID(); + } + + bool FirstDiag = true; + bool Satisfied = false; + std::optional<unsigned> ExpectedDiagID; + +public: + void SetNoDiag() { + Satisfied = true; + ExpectedDiagID = std::nullopt; + } + + void SetExpected(unsigned DiagID) { + Satisfied = false; + ExpectedDiagID = DiagID; + } + + bool IsSatisfied() { return Satisfied; } +}; + +// The test fixture. +class ParseHLSLRootSignatureTest : public ::testing::Test { +protected: + ParseHLSLRootSignatureTest() + : FileMgr(FileMgrOpts), DiagID(new DiagnosticIDs()), + Consumer(new ExpectedDiagConsumer()), + Diags(DiagID, new DiagnosticOptions, Consumer), + SourceMgr(Diags, FileMgr), TargetOpts(new TargetOptions) { + TargetOpts->Triple = "x86_64-apple-darwin11.1.0"; + Target = TargetInfo::CreateTargetInfo(Diags, TargetOpts); + } + + std::unique_ptr<Preprocessor> CreatePP(StringRef Source, + TrivialModuleLoader &ModLoader) { + std::unique_ptr<llvm::MemoryBuffer> Buf = + llvm::MemoryBuffer::getMemBuffer(Source); + SourceMgr.setMainFileID(SourceMgr.createFileID(std::move(Buf))); + + HeaderSearch HeaderInfo(std::make_shared<HeaderSearchOptions>(), SourceMgr, + Diags, LangOpts, Target.get()); + std::unique_ptr<Preprocessor> PP = std::make_unique<Preprocessor>( + std::make_shared<PreprocessorOptions>(), Diags, LangOpts, SourceMgr, + HeaderInfo, ModLoader, + /*IILookup =*/nullptr, + /*OwnsHeaderSearch =*/false); + PP->Initialize(*Target); + PP->EnterMainSourceFile(); + return PP; + } + + void CheckTokens(SmallVector<hlsl::RootSignatureToken> &Computed, + SmallVector<hlsl::TokenKind> &Expected) { + ASSERT_EQ(Computed.size(), Expected.size()); + for (unsigned I = 0, E = Expected.size(); I != E; ++I) { + ASSERT_EQ(Computed[I].Kind, Expected[I]); + } + } + + FileSystemOptions FileMgrOpts; + FileManager FileMgr; + IntrusiveRefCntPtr<DiagnosticIDs> DiagID; + ExpectedDiagConsumer *Consumer; + DiagnosticsEngine Diags; + SourceManager SourceMgr; + LangOptions LangOpts; + std::shared_ptr<TargetOptions> TargetOpts; + IntrusiveRefCntPtr<TargetInfo> Target; +}; + +// Valid Lexing Tests + +TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { + // This test will check that we can lex all defined tokens as defined in + // HLSLRootSignatureTokenKinds.def, plus some additional integer variations + const llvm::StringLiteral Source = R"cc( + (),|= + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test no diagnostics produced + Consumer->SetNoDiag(); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens = { + hlsl::RootSignatureToken( + SourceLocation()) // invalid token for completeness + }; + ASSERT_FALSE(Lexer.Lex(Tokens)); + ASSERT_TRUE(Consumer->IsSatisfied()); + + SmallVector<hlsl::TokenKind> Expected = { +#define TOK(NAME) hlsl::TokenKind::NAME, +#include "clang/Parse/HLSLRootSignatureTokenKinds.def" + }; + + CheckTokens(Tokens, Expected); +} + +// Invalid Lexing Tests + +TEST_F(ParseHLSLRootSignatureTest, InvalidLexIdentifierTest) { + // This test will check that the lexing fails due to no valid token + const llvm::StringLiteral Source = R"cc( + notAToken + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test correct diagnostic produced + Consumer->SetExpected(diag::err_hlsl_invalid_token); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens; + ASSERT_TRUE(Lexer.Lex(Tokens)); + ASSERT_TRUE(Consumer->IsSatisfied()); +} + +} // anonymous namespace >From 5f43ed80a6173ecf0b234da8b93cde2f76b2ef5b Mon Sep 17 00:00:00 2001 From: Finn Plummer <canadienf...@gmail.com> Date: Fri, 24 Jan 2025 22:28:05 +0000 Subject: [PATCH 2/5] Add lexing of integer literals - Integrate the use of the `NumericLiteralParser` to lex integer literals - Add additional hlsl specific diagnostics messages --- .../include/clang/Basic/DiagnosticLexKinds.td | 4 ++ .../Parse/HLSLRootSignatureTokenKinds.def | 1 + .../clang/Parse/ParseHLSLRootSignature.h | 6 ++ clang/lib/Parse/ParseHLSLRootSignature.cpp | 59 ++++++++++++++++ .../Parse/ParseHLSLRootSignatureTest.cpp | 69 +++++++++++++++++++ 5 files changed, 139 insertions(+) diff --git a/clang/include/clang/Basic/DiagnosticLexKinds.td b/clang/include/clang/Basic/DiagnosticLexKinds.td index 7755c05bc8969b..81d314c838cede 100644 --- a/clang/include/clang/Basic/DiagnosticLexKinds.td +++ b/clang/include/clang/Basic/DiagnosticLexKinds.td @@ -1020,6 +1020,10 @@ Error<"expected 'begin' or 'end'">; // HLSL Root Signature Lexing Errors let CategoryName = "Root Signature Lexical Issue" in { + def err_hlsl_invalid_number_literal: + Error<"expected number literal is not a supported number literal of unsigned integer or integer">; + def err_hlsl_number_literal_overflow : + Error<"provided %select{unsigned integer|signed integer}0 literal '%1' that overflows the maximum of 32 bits">; def err_hlsl_invalid_token: Error<"unable to lex a valid Root Signature token">; } diff --git a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def index 9625f6a5bd76d9..64c5fd14a2017f 100644 --- a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def +++ b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def @@ -23,6 +23,7 @@ // General Tokens: TOK(invalid) +TOK(int_literal) // Punctuators: PUNCTUATOR(l_paren, '(') diff --git a/clang/include/clang/Parse/ParseHLSLRootSignature.h b/clang/include/clang/Parse/ParseHLSLRootSignature.h index 39069e7cc39988..3b2c61781b1da3 100644 --- a/clang/include/clang/Parse/ParseHLSLRootSignature.h +++ b/clang/include/clang/Parse/ParseHLSLRootSignature.h @@ -13,7 +13,9 @@ #ifndef LLVM_CLANG_PARSE_PARSEHLSLROOTSIGNATURE_H #define LLVM_CLANG_PARSE_PARSEHLSLROOTSIGNATURE_H +#include "clang/AST/APValue.h" #include "clang/Basic/DiagnosticLex.h" +#include "clang/Lex/LiteralSupport.h" #include "clang/Lex/Preprocessor.h" #include "llvm/ADT/SmallVector.h" @@ -33,6 +35,8 @@ struct RootSignatureToken { // Retain the SouceLocation of the token for diagnostics clang::SourceLocation TokLoc; + APValue NumLiteral = APValue(); + // Constructors RootSignatureToken(clang::SourceLocation TokLoc) : TokLoc(TokLoc) {} }; @@ -60,6 +64,8 @@ class RootSignatureLexer { clang::SourceLocation SourceLoc; clang::Preprocessor &PP; + bool LexNumber(RootSignatureToken &Result); + // Consumes the internal buffer for a single token. // // The return value denotes if there was a failure. diff --git a/clang/lib/Parse/ParseHLSLRootSignature.cpp b/clang/lib/Parse/ParseHLSLRootSignature.cpp index a9a9d209085c91..1cc75998ca07da 100644 --- a/clang/lib/Parse/ParseHLSLRootSignature.cpp +++ b/clang/lib/Parse/ParseHLSLRootSignature.cpp @@ -5,6 +5,61 @@ namespace hlsl { // Lexer Definitions +static bool IsNumberChar(char C) { + // TODO(#120472): extend for float support exponents + return isdigit(C); // integer support +} + +bool RootSignatureLexer::LexNumber(RootSignatureToken &Result) { + // NumericLiteralParser does not handle the sign so we will manually apply it + bool Negative = Buffer.front() == '-'; + bool Signed = Negative || Buffer.front() == '+'; + if (Signed) + AdvanceBuffer(); + + // Retrieve the possible number + StringRef NumSpelling = Buffer.take_while(IsNumberChar); + + // Catch this now as the Literal Parser will accept it as valid + if (NumSpelling.empty()) { + PP.getDiagnostics().Report(Result.TokLoc, + diag::err_hlsl_invalid_number_literal); + return true; + } + + // Parse the numeric value and do semantic checks on its specification + clang::NumericLiteralParser Literal(NumSpelling, SourceLoc, + PP.getSourceManager(), PP.getLangOpts(), + PP.getTargetInfo(), PP.getDiagnostics()); + if (Literal.hadError) + return true; // Error has already been reported so just return + + if (!Literal.isIntegerLiteral()) { + // Note: if IsNumberChar allows for hexidecimal we will need to turn this + // into a diagnostics for potential fixed-point literals + llvm_unreachable("IsNumberChar will only support digits"); + return true; + } + + // Retrieve the number value to store into the token + Result.Kind = TokenKind::int_literal; + + llvm::APSInt X = llvm::APSInt(32, !Signed); + if (Literal.GetIntegerValue(X)) { + // Report that the value has overflowed + PP.getDiagnostics().Report(Result.TokLoc, + diag::err_hlsl_number_literal_overflow) + << (unsigned)Signed << NumSpelling; + return true; + } + + X = Negative ? -X : X; + Result.NumLiteral = APValue(X); + + AdvanceBuffer(NumSpelling.size()); + return false; +} + bool RootSignatureLexer::Lex(SmallVector<RootSignatureToken> &Tokens) { // Discard any leading whitespace AdvanceBuffer(Buffer.take_while(isspace).size()); @@ -41,6 +96,10 @@ bool RootSignatureLexer::LexToken(RootSignatureToken &Result) { break; } + // Numeric constant + if (isdigit(C) || C == '-' || C == '+') + return LexNumber(Result); + // Unable to match on any token type PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); return true; diff --git a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp index e5f88bbfa0ff6a..713bc5b1257f74 100644 --- a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp +++ b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp @@ -111,10 +111,39 @@ class ParseHLSLRootSignatureTest : public ::testing::Test { // Valid Lexing Tests +TEST_F(ParseHLSLRootSignatureTest, ValidLexNumbersTest) { + // This test will check that we can lex different number tokens + const llvm::StringLiteral Source = R"cc( + -42 42 +42 + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test no diagnostics produced + Consumer->SetNoDiag(); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens; + ASSERT_FALSE(Lexer.Lex(Tokens)); + ASSERT_TRUE(Consumer->IsSatisfied()); + + SmallVector<hlsl::TokenKind> Expected = { + hlsl::TokenKind::int_literal, + hlsl::TokenKind::int_literal, + hlsl::TokenKind::int_literal, + }; + CheckTokens(Tokens, Expected); +} + TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { // This test will check that we can lex all defined tokens as defined in // HLSLRootSignatureTokenKinds.def, plus some additional integer variations const llvm::StringLiteral Source = R"cc( + 42 + (),|= )cc"; @@ -144,6 +173,46 @@ TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { // Invalid Lexing Tests +TEST_F(ParseHLSLRootSignatureTest, InvalidLexOverflowedNumberTest) { + // This test will check that the lexing fails due to an integer overflow + const llvm::StringLiteral Source = R"cc( + 4294967296 + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test correct diagnostic produced + Consumer->SetExpected(diag::err_hlsl_number_literal_overflow); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens; + ASSERT_TRUE(Lexer.Lex(Tokens)); + ASSERT_TRUE(Consumer->IsSatisfied()); +} + +TEST_F(ParseHLSLRootSignatureTest, InvalidLexEmptyNumberTest) { + // This test will check that the lexing fails due to no integer being provided + const llvm::StringLiteral Source = R"cc( + - + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test correct diagnostic produced + Consumer->SetExpected(diag::err_hlsl_invalid_number_literal); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens; + ASSERT_TRUE(Lexer.Lex(Tokens)); + ASSERT_TRUE(Consumer->IsSatisfied()); +} + TEST_F(ParseHLSLRootSignatureTest, InvalidLexIdentifierTest) { // This test will check that the lexing fails due to no valid token const llvm::StringLiteral Source = R"cc( >From dc0c7ba8da50f3b12395d1ff90f77c42073d21ff Mon Sep 17 00:00:00 2001 From: Finn Plummer <canadienf...@gmail.com> Date: Fri, 24 Jan 2025 21:04:36 +0000 Subject: [PATCH 3/5] Add support for lexing registers --- .../include/clang/Basic/DiagnosticLexKinds.td | 1 + .../Parse/HLSLRootSignatureTokenKinds.def | 6 +++ clang/lib/Parse/ParseHLSLRootSignature.cpp | 47 +++++++++++++++++++ .../Parse/ParseHLSLRootSignatureTest.cpp | 23 +++++++++ 4 files changed, 77 insertions(+) diff --git a/clang/include/clang/Basic/DiagnosticLexKinds.td b/clang/include/clang/Basic/DiagnosticLexKinds.td index 81d314c838cede..cbadd16df3f9db 100644 --- a/clang/include/clang/Basic/DiagnosticLexKinds.td +++ b/clang/include/clang/Basic/DiagnosticLexKinds.td @@ -1025,6 +1025,7 @@ let CategoryName = "Root Signature Lexical Issue" in { def err_hlsl_number_literal_overflow : Error<"provided %select{unsigned integer|signed integer}0 literal '%1' that overflows the maximum of 32 bits">; def err_hlsl_invalid_token: Error<"unable to lex a valid Root Signature token">; + def err_hlsl_invalid_register_literal: Error<"expected unsigned integer literal as part of register">; } } diff --git a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def index 64c5fd14a2017f..fc4dbfef728798 100644 --- a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def +++ b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def @@ -25,6 +25,12 @@ TOK(invalid) TOK(int_literal) +// Register Tokens: +TOK(bReg) +TOK(tReg) +TOK(uReg) +TOK(sReg) + // Punctuators: PUNCTUATOR(l_paren, '(') PUNCTUATOR(r_paren, ')') diff --git a/clang/lib/Parse/ParseHLSLRootSignature.cpp b/clang/lib/Parse/ParseHLSLRootSignature.cpp index 1cc75998ca07da..1b9973beb44170 100644 --- a/clang/lib/Parse/ParseHLSLRootSignature.cpp +++ b/clang/lib/Parse/ParseHLSLRootSignature.cpp @@ -100,6 +100,53 @@ bool RootSignatureLexer::LexToken(RootSignatureToken &Result) { if (isdigit(C) || C == '-' || C == '+') return LexNumber(Result); + // All following tokens require at least one additional character + if (Buffer.size() <= 1) { + PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); + return true; + } + + // Peek at the next character to deteremine token type + char NextC = Buffer[1]; + + // Registers: [tsub][0-9+] + if ((C == 't' || C == 's' || C == 'u' || C == 'b') && isdigit(NextC)) { + AdvanceBuffer(); + + if (LexNumber(Result)) + return true; // Error parsing number which is already reported + + // Lex number could also parse a float so ensure it was an unsigned int + if (Result.Kind != TokenKind::int_literal || + Result.NumLiteral.getInt().isSigned()) { + // Return invalid number literal for register error + PP.getDiagnostics().Report(Result.TokLoc, + diag::err_hlsl_invalid_register_literal); + return true; + } + + // Convert character to the register type. + // This is done after LexNumber to override the TokenKind + switch (C) { + case 'b': + Result.Kind = TokenKind::bReg; + break; + case 't': + Result.Kind = TokenKind::tReg; + break; + case 'u': + Result.Kind = TokenKind::uReg; + break; + case 's': + Result.Kind = TokenKind::sReg; + break; + default: + llvm_unreachable("Switch for an expected token was not provided"); + return true; + } + return false; + } + // Unable to match on any token type PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); return true; diff --git a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp index 713bc5b1257f74..47195099ed60df 100644 --- a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp +++ b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp @@ -144,6 +144,8 @@ TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { const llvm::StringLiteral Source = R"cc( 42 + b0 t43 u987 s234 + (),|= )cc"; @@ -213,6 +215,27 @@ TEST_F(ParseHLSLRootSignatureTest, InvalidLexEmptyNumberTest) { ASSERT_TRUE(Consumer->IsSatisfied()); } +TEST_F(ParseHLSLRootSignatureTest, InvalidLexRegNumberTest) { + // This test will check that the lexing fails due to no integer being provided + const llvm::StringLiteral Source = R"cc( + b32.4 + )cc"; + + TrivialModuleLoader ModLoader; + auto PP = CreatePP(Source, ModLoader); + auto TokLoc = SourceLocation(); + + // Test correct diagnostic produced + Consumer->SetExpected(diag::err_hlsl_invalid_register_literal); + + hlsl::RootSignatureLexer Lexer(Source, TokLoc, *PP); + + SmallVector<hlsl::RootSignatureToken> Tokens; + ASSERT_TRUE(Lexer.Lex(Tokens)); + // FIXME(#120472): This should be TRUE once we can lex a floating + ASSERT_FALSE(Consumer->IsSatisfied()); +} + TEST_F(ParseHLSLRootSignatureTest, InvalidLexIdentifierTest) { // This test will check that the lexing fails due to no valid token const llvm::StringLiteral Source = R"cc( >From c5d3881c89cbed9f3dd7782ebad08e9a71f4bd64 Mon Sep 17 00:00:00 2001 From: Finn Plummer <canadienf...@gmail.com> Date: Fri, 24 Jan 2025 21:40:23 +0000 Subject: [PATCH 4/5] Add lexing for example keyword and enum --- .../Parse/HLSLRootSignatureTokenKinds.def | 20 ++++++++++++++++ .../clang/Parse/ParseHLSLRootSignature.h | 1 + clang/lib/Parse/ParseHLSLRootSignature.cpp | 23 ++++++++++++++++--- .../Parse/ParseHLSLRootSignatureTest.cpp | 4 ++++ 4 files changed, 45 insertions(+), 3 deletions(-) diff --git a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def index fc4dbfef728798..d73c9adbb94e5c 100644 --- a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def +++ b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def @@ -20,6 +20,17 @@ #ifndef PUNCTUATOR #define PUNCTUATOR(X,Y) TOK(pu_ ## X) #endif +#ifndef KEYWORD +#define KEYWORD(X) TOK(kw_ ## X) +#endif +#ifndef ENUM +#define ENUM(NAME, LIT) TOK(en_ ## NAME) +#endif + +// Defines the various types of enum +#ifndef DESCRIPTOR_RANGE_OFFSET_ENUM +#define DESCRIPTOR_RANGE_OFFSET_ENUM(NAME, LIT) ENUM(NAME, LIT) +#endif // General Tokens: TOK(invalid) @@ -38,5 +49,14 @@ PUNCTUATOR(comma, ',') PUNCTUATOR(or, '|') PUNCTUATOR(equal, '=') +// RootElement Keywords: +KEYWORD(DescriptorTable) + +// Descriptor Range Offset Enum: +DESCRIPTOR_RANGE_OFFSET_ENUM(DescriptorRangeOffsetAppend, "DESCRIPTOR_RANGE_OFFSET_APPEND") + +#undef DESCRIPTOR_RANGE_OFFSET_ENUM +#undef ENUM +#undef KEYWORD #undef PUNCTUATOR #undef TOK diff --git a/clang/include/clang/Parse/ParseHLSLRootSignature.h b/clang/include/clang/Parse/ParseHLSLRootSignature.h index 3b2c61781b1da3..899608bd1527ea 100644 --- a/clang/include/clang/Parse/ParseHLSLRootSignature.h +++ b/clang/include/clang/Parse/ParseHLSLRootSignature.h @@ -20,6 +20,7 @@ #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/StringRef.h" +#include "llvm/ADT/StringSwitch.h" namespace clang { namespace hlsl { diff --git a/clang/lib/Parse/ParseHLSLRootSignature.cpp b/clang/lib/Parse/ParseHLSLRootSignature.cpp index 1b9973beb44170..7ceb85a47a088e 100644 --- a/clang/lib/Parse/ParseHLSLRootSignature.cpp +++ b/clang/lib/Parse/ParseHLSLRootSignature.cpp @@ -147,9 +147,26 @@ bool RootSignatureLexer::LexToken(RootSignatureToken &Result) { return false; } - // Unable to match on any token type - PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); - return true; + // Keywords and Enums: + StringRef TokSpelling = + Buffer.take_while([](char C) { return isalnum(C) || C == '_'; }); + + // Define a large string switch statement for all the keywords and enums + auto Switch = llvm::StringSwitch<TokenKind>(TokSpelling); +#define KEYWORD(NAME) Switch.Case(#NAME, TokenKind::kw_##NAME); +#define ENUM(NAME, LIT) Switch.CaseLower(LIT, TokenKind::en_##NAME); +#include "clang/Parse/HLSLRootSignatureTokenKinds.def" + + // Then attempt to retreive a string from it + auto Kind = Switch.Default(TokenKind::invalid); + if (Kind == TokenKind::invalid) { + PP.getDiagnostics().Report(Result.TokLoc, diag::err_hlsl_invalid_token); + return true; + } + + Result.Kind = Kind; + AdvanceBuffer(TokSpelling.size()); + return false; } } // namespace hlsl diff --git a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp index 47195099ed60df..d80ded10ba313c 100644 --- a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp +++ b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp @@ -147,6 +147,10 @@ TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { b0 t43 u987 s234 (),|= + + DescriptorTable + + DESCRIPTOR_RANGE_OFFSET_APPEND )cc"; TrivialModuleLoader ModLoader; >From dc784ffa0da9b7e2d16397912f53c0408d3208c7 Mon Sep 17 00:00:00 2001 From: Finn Plummer <canadienf...@gmail.com> Date: Fri, 24 Jan 2025 21:44:24 +0000 Subject: [PATCH 5/5] Add lexing for remaining DescriptorTable keywords and enums --- .../Parse/HLSLRootSignatureTokenKinds.def | 59 +++++++++++++++++++ .../Parse/ParseHLSLRootSignatureTest.cpp | 19 ++++++ 2 files changed, 78 insertions(+) diff --git a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def index d73c9adbb94e5c..5e47af8d4b1364 100644 --- a/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def +++ b/clang/include/clang/Parse/HLSLRootSignatureTokenKinds.def @@ -31,6 +31,23 @@ #ifndef DESCRIPTOR_RANGE_OFFSET_ENUM #define DESCRIPTOR_RANGE_OFFSET_ENUM(NAME, LIT) ENUM(NAME, LIT) #endif +#ifndef ROOT_DESCRIPTOR_FLAG_ENUM +#define ROOT_DESCRIPTOR_FLAG_ENUM(NAME, LIT) ENUM(NAME, LIT) +#endif +// Note: ON denotes that the flag is unique from the above Root Descriptor +// Flags. This is required to avoid token kind enum conflicts. +#ifndef DESCRIPTOR_RANGE_FLAG_ENUM_OFF +#define DESCRIPTOR_RANGE_FLAG_ENUM_OFF(NAME, LIT) +#endif +#ifndef DESCRIPTOR_RANGE_FLAG_ENUM_ON +#define DESCRIPTOR_RANGE_FLAG_ENUM_ON(NAME, LIT) ENUM(NAME, LIT) +#endif +#ifndef DESCRIPTOR_RANGE_FLAG_ENUM +#define DESCRIPTOR_RANGE_FLAG_ENUM(NAME, LIT, ON) DESCRIPTOR_RANGE_FLAG_ENUM_##ON(NAME, LIT) +#endif +#ifndef SHADER_VISIBILITY_ENUM +#define SHADER_VISIBILITY_ENUM(NAME, LIT) ENUM(NAME, LIT) +#endif // General Tokens: TOK(invalid) @@ -52,9 +69,51 @@ PUNCTUATOR(equal, '=') // RootElement Keywords: KEYWORD(DescriptorTable) +// DescriptorTable Keywords: +KEYWORD(CBV) +KEYWORD(SRV) +KEYWORD(UAV) +KEYWORD(Sampler) + +// General Parameter Keywords: +KEYWORD(space) +KEYWORD(visibility) +KEYWORD(flags) + +// View Parameter Keywords: +KEYWORD(numDescriptors) +KEYWORD(offset) + // Descriptor Range Offset Enum: DESCRIPTOR_RANGE_OFFSET_ENUM(DescriptorRangeOffsetAppend, "DESCRIPTOR_RANGE_OFFSET_APPEND") +// Root Descriptor Flag Enums: +ROOT_DESCRIPTOR_FLAG_ENUM(DataVolatile, "DATA_VOLATILE") +ROOT_DESCRIPTOR_FLAG_ENUM(DataStaticWhileSetAtExecute, "DATA_STATIC_WHILE_SET_AT_EXECUTE") +ROOT_DESCRIPTOR_FLAG_ENUM(DataStatic, "DATA_STATIC") + +// Descriptor Range Flag Enums: +DESCRIPTOR_RANGE_FLAG_ENUM(DescriptorsVolatile, "DESCRIPTORS_VOLATILE", ON) +DESCRIPTOR_RANGE_FLAG_ENUM(DataVolatile, "DATA_VOLATILE", OFF) +DESCRIPTOR_RANGE_FLAG_ENUM(DataStaticWhileSetAtExecute, "DATA_STATIC_WHILE_SET_AT_EXECUTE", OFF) +DESCRIPTOR_RANGE_FLAG_ENUM(DataStatic, "DATA_STATIC", OFF) +DESCRIPTOR_RANGE_FLAG_ENUM(DescriptorsStaticKeepingBufferBoundsChecks, "DESCRIPTORS_STATIC_KEEPING_BUFFER_BOUNDS_CHECKS", ON) + +// Shader Visibiliy Enums: +SHADER_VISIBILITY_ENUM(All, "SHADER_VISIBILITY_ALL") +SHADER_VISIBILITY_ENUM(Vertex, "SHADER_VISIBILITY_VERTEX") +SHADER_VISIBILITY_ENUM(Hull, "SHADER_VISIBILITY_HULL") +SHADER_VISIBILITY_ENUM(Domain, "SHADER_VISIBILITY_DOMAIN") +SHADER_VISIBILITY_ENUM(Geometry, "SHADER_VISIBILITY_GEOMETRY") +SHADER_VISIBILITY_ENUM(Pixel, "SHADER_VISIBILITY_PIXEL") +SHADER_VISIBILITY_ENUM(Amplification, "SHADER_VISIBILITY_AMPLIFICATION") +SHADER_VISIBILITY_ENUM(Mesh, "SHADER_VISIBILITY_MESH") + +#undef SHADER_VISIBILITY_ENUM +#undef DESCRIPTOR_RANGE_FLAG_ENUM +#undef DESCRIPTOR_RANGE_FLAG_ENUM_OFF +#undef DESCRIPTOR_RANGE_FLAG_ENUM_ON +#undef ROOT_DESCRIPTOR_FLAG_ENUM #undef DESCRIPTOR_RANGE_OFFSET_ENUM #undef ENUM #undef KEYWORD diff --git a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp index d80ded10ba313c..57b61e43746a0b 100644 --- a/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp +++ b/clang/unittests/Parse/ParseHLSLRootSignatureTest.cpp @@ -150,7 +150,26 @@ TEST_F(ParseHLSLRootSignatureTest, ValidLexAllTokensTest) { DescriptorTable + CBV SRV UAV Sampler + space visibility flags + numDescriptors offset + DESCRIPTOR_RANGE_OFFSET_APPEND + + DATA_VOLATILE + DATA_STATIC_WHILE_SET_AT_EXECUTE + DATA_STATIC + DESCRIPTORS_VOLATILE + DESCRIPTORS_STATIC_KEEPING_BUFFER_BOUNDS_CHECKS + + shader_visibility_all + shader_visibility_vertex + shader_visibility_hull + shader_visibility_domain + shader_visibility_geometry + shader_visibility_pixel + shader_visibility_amplification + shader_visibility_mesh )cc"; TrivialModuleLoader ModLoader; _______________________________________________ cfe-commits mailing list cfe-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits