https://github.com/alejandro-alvarez-sonarsource created https://github.com/llvm/llvm-project/pull/156507
Signature: ```c size_t strxfrm(char *dest, const char *src, size_t n); ``` The modeling covers: * `src` can never be null * `dest` can be null only if `n` is 0, and then the return value is some unspecified positive integer * `src` and `dest` must not overlap * `dest` must have at least `n` bytes of capacity * The return value can either be: - `< n`, and the contents of the buffer pointed to by `dest` are invalidated - `>= n`, and the contents of the buffer pointed to by `dest` are marked as undefined CPP-6854 From 736d0dcf2e31f402607656bf100004f8c8dd6539 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Alejandro=20=C3=81lvarez=20Ayll=C3=B3n?= <alejandro.alva...@sonarsource.com> Date: Fri, 29 Aug 2025 09:51:04 +0200 Subject: [PATCH] [clang][analyzer] Model `strxfrm` Signature: ```c size_t strxfrm(char *dest, const char *src, size_t n); ``` The modeling covers: * `src` can never be null * `dest` can be null only if `n` is 0, and then the return value is some unspecified positive integer * `src` and `dest` must not overlap * `dest` must have at least `n` bytes of capacity * The return value can either be: - `< n`, and the contents of the buffer pointed to by `dest` are invalidated - `>= n`, and the contents of the buffer pointed to by `dest` are marked as undefined CPP-6854 --- .../Checkers/CStringChecker.cpp | 100 ++++++++++++++++++ clang/test/Analysis/string.c | 57 ++++++++++ 2 files changed, 157 insertions(+) diff --git a/clang/lib/StaticAnalyzer/Checkers/CStringChecker.cpp b/clang/lib/StaticAnalyzer/Checkers/CStringChecker.cpp index cfc6d34a75ca2..296a803bd04c2 100644 --- a/clang/lib/StaticAnalyzer/Checkers/CStringChecker.cpp +++ b/clang/lib/StaticAnalyzer/Checkers/CStringChecker.cpp @@ -101,6 +101,7 @@ class CStringChecker static void *getTag() { static int tag; return &tag; } + bool evalCall(const CallEvent &Call, CheckerContext &C) const; void checkPreStmt(const DeclStmt *DS, CheckerContext &C) const; void checkLiveSymbols(ProgramStateRef state, SymbolReaper &SR) const; @@ -163,6 +164,7 
@@ class CStringChecker {{CDM::CLibrary, {"strcasecmp"}, 2}, &CStringChecker::evalStrcasecmp}, {{CDM::CLibrary, {"strncasecmp"}, 3}, &CStringChecker::evalStrncasecmp}, {{CDM::CLibrary, {"strsep"}, 2}, &CStringChecker::evalStrsep}, + {{CDM::CLibrary, {"strxfrm"}, 3}, &CStringChecker::evalStrxfrm}, {{CDM::CLibrary, {"bcopy"}, 3}, &CStringChecker::evalBcopy}, {{CDM::CLibrary, {"bcmp"}, 3}, std::bind(&CStringChecker::evalMemcmp, _1, _2, _3, CK_Regular)}, @@ -211,6 +213,8 @@ class CStringChecker bool ReturnEnd, bool IsBounded, ConcatFnKind appendK, bool returnPtr = true) const; + void evalStrxfrm(CheckerContext &C, const CallEvent &Call) const; + void evalStrcat(CheckerContext &C, const CallEvent &Call) const; void evalStrncat(CheckerContext &C, const CallEvent &Call) const; void evalStrlcat(CheckerContext &C, const CallEvent &Call) const; @@ -2243,6 +2247,102 @@ void CStringChecker::evalStrcpyCommon(CheckerContext &C, const CallEvent &Call, C.addTransition(state); } +void CStringChecker::evalStrxfrm(CheckerContext &C, + const CallEvent &Call) const { + // size_t strxfrm(char *dest, const char *src, size_t n); + CurrentFunctionDescription = "locale transformation function"; + + ProgramStateRef state = C.getState(); + const LocationContext *LCtx = C.getLocationContext(); + SValBuilder &SVB = C.getSValBuilder(); + + // Get arguments + DestinationArgExpr Dest = {{Call.getArgExpr(0), 0}}; + SourceArgExpr Source = {{Call.getArgExpr(1), 1}}; + SizeArgExpr Size = {{Call.getArgExpr(2), 2}}; + + // `src` can never be null + SVal SrcVal = state->getSVal(Source.Expression, LCtx); + state = checkNonNull(C, state, Source, SrcVal); + if (!state) + return; + + // Check overlaps + state = CheckOverlap(C, state, Size, Dest, Source, CK_Regular); + if (!state) + return; + + // The function returns an implementation-defined length needed for + // transformation + SVal retVal = SVB.conjureSymbolVal(Call, C.blockCount()); + + state = state->BindExpr(Call.getOriginExpr(), LCtx, retVal); + + 
// Check if size is zero + SVal sizeVal = state->getSVal(Size.Expression, LCtx); + QualType sizeTy = Size.Expression->getType(); + + auto [stateZeroSize, StateSizeNonZero] = + assumeZero(C, state, sizeVal, sizeTy); + + // If `n` is 0, we just return the implementation defined length + if (stateZeroSize && !StateSizeNonZero) { + C.addTransition(stateZeroSize); + return; + } + + if (!StateSizeNonZero) + return; + + // If `n` is not 0, `dest` can not be null. + SVal destVal = state->getSVal(Dest.Expression, LCtx); + StateSizeNonZero = checkNonNull(C, StateSizeNonZero, Dest, destVal); + if (!StateSizeNonZero) + return; + + // Check that we can write to the destination buffer + StateSizeNonZero = CheckBufferAccess(C, StateSizeNonZero, Dest, Size, + AccessKind::write, CK_Regular); + if (!StateSizeNonZero) + return; + + // Success: return value < `n` + // Failure: return value >= `n` + auto comparisonVal = SVB.evalBinOp(StateSizeNonZero, BO_LT, retVal, sizeVal, + SVB.getConditionType()) + .getAs<DefinedOrUnknownSVal>(); + + if (comparisonVal) { + auto [StateSuccess, StateFailure] = + StateSizeNonZero->assume(*comparisonVal); + + if (StateSuccess) { + // In this case, the transformation invalidated the buffer. + StateSuccess = invalidateDestinationBufferBySize( + C, StateSuccess, Dest.Expression, Call.getCFGElementRef(), destVal, + sizeVal, Size.Expression->getType()); + + C.addTransition(StateSuccess); + } + + if (StateFailure) { + // In this case, dest buffer content is undefined + if (std::optional<Loc> destLoc = destVal.getAs<Loc>()) { + StateFailure = StateFailure->bindLoc(*destLoc, UndefinedVal{}, LCtx); + } + + C.addTransition(StateFailure); + } + } else { + // Fallback: invalidate the buffer. 
+ StateSizeNonZero = invalidateDestinationBufferBySize( + C, StateSizeNonZero, Dest.Expression, Call.getCFGElementRef(), destVal, + sizeVal, Size.Expression->getType()); + + C.addTransition(StateSizeNonZero); + } +} + void CStringChecker::evalStrcmp(CheckerContext &C, const CallEvent &Call) const { //int strcmp(const char *s1, const char *s2); diff --git a/clang/test/Analysis/string.c b/clang/test/Analysis/string.c index e017aff3b4a1d..427b99bfdf295 100644 --- a/clang/test/Analysis/string.c +++ b/clang/test/Analysis/string.c @@ -1789,3 +1789,60 @@ void CWE124_Buffer_Underwrite__malloc_char_memcpy() { free(dataBuffer); } #endif + +//===----------------------------------------------------------------------=== +// strxfrm() +// It is not a built-in. +//===----------------------------------------------------------------------=== + +size_t strxfrm(char *dest, const char *src, size_t n); + +void strxfrm_null_dest(const char *src) { + strxfrm(NULL, src, 0); // no warning + strxfrm(NULL, src, 10); // expected-warning {{Null pointer passed as 1st argument}} +} + +void strxfrm_null_source(char *dest) { + strxfrm(dest, NULL, 0); // expected-warning {{Null pointer passed as 2nd argument}} +} + +#ifndef SUPPRESS_OUT_OF_BOUND +void strxfrm_overflow(const char *src) { + char dest[10]; + strxfrm(dest, src, 55); // expected-warning {{Locale transformation function overflows the destination buffer}} +} +#endif + +void strxfrm_source_smaller() { + char dest[10]; + char source[5]; + strxfrm(dest, source, 10); +} + +void strxfrm_overlap(char *dest) { + strxfrm(dest, dest, 10); // expected-warning {{Arguments must not be overlapping buffers}} +} + +void strxfrm_regular(const char *src) { + size_t n = strxfrm(NULL, src, 0); + char *dest = (char*)malloc(n + 1); + strxfrm(dest, src, n); + free(dest); +} + +int strxfrm_dest_undef(const char *src) { + char dest[10] = {0}; + size_t n = strxfrm(dest, src, sizeof(dest)); + + int c = 0; + if (n >= sizeof(dest)) { + for (int i = 0; i < 
sizeof(dest); ++i) { + c += dest[i]; // expected-warning {{Assigned value is uninitialized}} + } + } else { + for (int i = 0; i < sizeof(dest); ++i) { + c += dest[i]; // no-warning + } + } + return c; +} _______________________________________________ cfe-commits mailing list cfe-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits