Applied to master. Thanks!
Philipp.

On Wed, 6 Sept 2023 at 18:07, Christoph Muellner
<christoph.muell...@vrull.eu> wrote:
>
> From: Christoph Müllner <christoph.muell...@vrull.eu>
>
> This patch implements the expansion of the strlen builtin for RV32/RV64
> for xlen-aligned aligned strings if Zbb or XTheadBb instructions are 
> available.
> The inserted sequences are:
>
> rv32gc_zbb (RV64 is similar):
>       add     a3,a0,4
>       li      a4,-1
> .L1:  lw      a5,0(a0)
>       add     a0,a0,4
>       orc.b   a5,a5
>       beq     a5,a4,.L1
>       not     a5,a5
>       ctz     a5,a5
>       srl     a5,a5,0x3
>       add     a0,a0,a5
>       sub     a0,a0,a3
>
> rv64gc_xtheadbb (RV32 is similar):
>       add       a4,a0,8
> .L2:  ld        a5,0(a0)
>       add       a0,a0,8
>       th.tstnbz a5,a5
>       beqz      a5,.L2
>       th.rev    a5,a5
>       th.ff1    a5,a5
>       srl       a5,a5,0x3
>       add       a0,a0,a5
>       sub       a0,a0,a4
>
> This allows to inline calls to strlen(), with optimized code for
> xlen-aligned strings, resulting in the following benefits over
> a call to libc:
> * no call/ret instructions
> * no stack frame allocation
> * no register saving/restoring
> * no alignment test
>
> The inlining mechanism is gated by a new switch ('-minline-strlen')
> and by the variable 'optimize_size'.
>
> Tested using the glibc string tests.
>
> Signed-off-by: Christoph Müllner <christoph.muell...@vrull.eu>
>
> gcc/ChangeLog:
>
>         * config.gcc: Add new object riscv-string.o.
>         riscv-string.cc.
>         * config/riscv/riscv-protos.h (riscv_expand_strlen):
>         New function.
>         * config/riscv/riscv.md (strlen<mode>): New expand INSN.
>         * config/riscv/riscv.opt: New flag 'minline-strlen'.
>         * config/riscv/t-riscv: Add new object riscv-string.o.
>         * config/riscv/thead.md (th_rev<mode>2): Export INSN name.
>         (th_rev<mode>2): Likewise.
>         (th_tstnbz<mode>2): New INSN.
>         * doc/invoke.texi: Document '-minline-strlen'.
>         * emit-rtl.cc (emit_likely_jump_insn): New helper function.
>         (emit_unlikely_jump_insn): Likewise.
>         * rtl.h (emit_likely_jump_insn): New prototype.
>         (emit_unlikely_jump_insn): Likewise.
>         * config/riscv/riscv-string.cc: New file.
>
> gcc/testsuite/ChangeLog:
>
>         * gcc.target/riscv/xtheadbb-strlen-unaligned.c: New test.
>         * gcc.target/riscv/xtheadbb-strlen.c: New test.
>         * gcc.target/riscv/zbb-strlen-disabled-2.c: New test.
>         * gcc.target/riscv/zbb-strlen-disabled.c: New test.
>         * gcc.target/riscv/zbb-strlen-unaligned.c: New test.
>         * gcc.target/riscv/zbb-strlen.c: New test.
> ---
>  gcc/config.gcc                                |   3 +-
>  gcc/config/riscv/riscv-protos.h               |   3 +
>  gcc/config/riscv/riscv-string.cc              | 183 ++++++++++++++++++
>  gcc/config/riscv/riscv.md                     |  28 +++
>  gcc/config/riscv/riscv.opt                    |   4 +
>  gcc/config/riscv/t-riscv                      |   6 +
>  gcc/config/riscv/thead.md                     |   9 +-
>  gcc/doc/invoke.texi                           |  11 +-
>  gcc/emit-rtl.cc                               |  24 +++
>  gcc/rtl.h                                     |   2 +
>  .../riscv/xtheadbb-strlen-unaligned.c         |  14 ++
>  .../gcc.target/riscv/xtheadbb-strlen.c        |  19 ++
>  .../gcc.target/riscv/zbb-strlen-disabled-2.c  |  15 ++
>  .../gcc.target/riscv/zbb-strlen-disabled.c    |  15 ++
>  .../gcc.target/riscv/zbb-strlen-unaligned.c   |  14 ++
>  gcc/testsuite/gcc.target/riscv/zbb-strlen.c   |  19 ++
>  16 files changed, 366 insertions(+), 3 deletions(-)
>  create mode 100644 gcc/config/riscv/riscv-string.cc
>  create mode 100644 gcc/testsuite/gcc.target/riscv/xtheadbb-strlen-unaligned.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/xtheadbb-strlen.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled-2.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/zbb-strlen-unaligned.c
>  create mode 100644 gcc/testsuite/gcc.target/riscv/zbb-strlen.c
>
> diff --git a/gcc/config.gcc b/gcc/config.gcc
> index b2fe7c7ceef..aff6b6a5601 100644
> --- a/gcc/config.gcc
> +++ b/gcc/config.gcc
> @@ -530,7 +530,8 @@ pru-*-*)
>         ;;
>  riscv*)
>         cpu_type=riscv
> -       extra_objs="riscv-builtins.o riscv-c.o riscv-sr.o 
> riscv-shorten-memrefs.o riscv-selftests.o riscv-v.o riscv-vsetvl.o 
> riscv-vector-costs.o"
> +       extra_objs="riscv-builtins.o riscv-c.o riscv-sr.o 
> riscv-shorten-memrefs.o riscv-selftests.o riscv-string.o"
> +       extra_objs="${extra_objs} riscv-v.o riscv-vsetvl.o 
> riscv-vector-costs.o"
>         extra_objs="${extra_objs} riscv-vector-builtins.o 
> riscv-vector-builtins-shapes.o riscv-vector-builtins-bases.o"
>         extra_objs="${extra_objs} thead.o"
>         d_target_objs="riscv-d.o"
> diff --git a/gcc/config/riscv/riscv-protos.h b/gcc/config/riscv/riscv-protos.h
> index 6dbf6b9f943..b060d047f01 100644
> --- a/gcc/config/riscv/riscv-protos.h
> +++ b/gcc/config/riscv/riscv-protos.h
> @@ -517,6 +517,9 @@ const unsigned int RISCV_BUILTIN_SHIFT = 1;
>  /* Mask that selects the riscv_builtin_class part of a function code.  */
>  const unsigned int RISCV_BUILTIN_CLASS = (1 << RISCV_BUILTIN_SHIFT) - 1;
>
> +/* Routines implemented in riscv-string.cc.  */
> +extern bool riscv_expand_strlen (rtx, rtx, rtx, rtx);
> +
>  /* Routines implemented in thead.cc.  */
>  extern bool th_mempair_operands_p (rtx[4], bool, machine_mode);
>  extern void th_mempair_order_operands (rtx[4], bool, machine_mode);
> diff --git a/gcc/config/riscv/riscv-string.cc 
> b/gcc/config/riscv/riscv-string.cc
> new file mode 100644
> index 00000000000..086900a6083
> --- /dev/null
> +++ b/gcc/config/riscv/riscv-string.cc
> @@ -0,0 +1,183 @@
> +/* Subroutines used to expand string operations for RISC-V.
> +   Copyright (C) 2023 Free Software Foundation, Inc.
> +
> +   This file is part of GCC.
> +
> +   GCC is free software; you can redistribute it and/or modify it
> +   under the terms of the GNU General Public License as published
> +   by the Free Software Foundation; either version 3, or (at your
> +   option) any later version.
> +
> +   GCC is distributed in the hope that it will be useful, but WITHOUT
> +   ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
> +   or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public
> +   License for more details.
> +
> +   You should have received a copy of the GNU General Public License
> +   along with GCC; see the file COPYING3.  If not see
> +   <http://www.gnu.org/licenses/>.  */
> +
> +#define IN_TARGET_CODE 1
> +
> +#include "config.h"
> +#include "system.h"
> +#include "coretypes.h"
> +#include "backend.h"
> +#include "rtl.h"
> +#include "tree.h"
> +#include "memmodel.h"
> +#include "tm_p.h"
> +#include "ira.h"
> +#include "print-tree.h"
> +#include "varasm.h"
> +#include "explow.h"
> +#include "expr.h"
> +#include "output.h"
> +#include "target.h"
> +#include "predict.h"
> +#include "optabs.h"
> +
> +/* Emit proper instruction depending on mode of dest.  */
> +
> +#define GEN_EMIT_HELPER2(name)                         \
> +static rtx_insn *                                      \
> +do_## name ## 2(rtx dest, rtx src)                     \
> +{                                                      \
> +  rtx_insn *insn;                                      \
> +  if (GET_MODE (dest) == DImode)                       \
> +    insn = emit_insn (gen_ ## name ## di2 (dest, src));        \
> +  else                                                 \
> +    insn = emit_insn (gen_ ## name ## si2 (dest, src));        \
> +  return insn;                                         \
> +}
> +
> +/* Emit proper instruction depending on mode of dest.  */
> +
> +#define GEN_EMIT_HELPER3(name)                                 \
> +static rtx_insn *                                              \
> +do_## name ## 3(rtx dest, rtx src1, rtx src2)                  \
> +{                                                              \
> +  rtx_insn *insn;                                              \
> +  if (GET_MODE (dest) == DImode)                               \
> +    insn = emit_insn (gen_ ## name ## di3 (dest, src1, src2)); \
> +  else                                                         \
> +    insn = emit_insn (gen_ ## name ## si3 (dest, src1, src2)); \
> +  return insn;                                                 \
> +}
> +
> +GEN_EMIT_HELPER3(add) /* do_add3  */
> +GEN_EMIT_HELPER2(clz) /* do_clz2  */
> +GEN_EMIT_HELPER2(ctz) /* do_ctz2  */
> +GEN_EMIT_HELPER3(lshr) /* do_lshr3  */
> +GEN_EMIT_HELPER2(orcb) /* do_orcb2  */
> +GEN_EMIT_HELPER2(one_cmpl) /* do_one_cmpl2  */
> +GEN_EMIT_HELPER3(sub) /* do_sub3  */
> +GEN_EMIT_HELPER2(th_rev) /* do_th_rev2  */
> +GEN_EMIT_HELPER2(th_tstnbz) /* do_th_tstnbz2  */
> +GEN_EMIT_HELPER2(zero_extendqi) /* do_zero_extendqi2  */
> +
> +#undef GEN_EMIT_HELPER2
> +#undef GEN_EMIT_HELPER3
> +
> +/* Helper function to load a byte or a Pmode register.
> +
> +   MODE is the mode to use for the load (QImode or Pmode).
> +   DEST is the destination register for the data.
> +   ADDR_REG is the register that holds the address.
> +   ADDR is the address expression to load from.
> +
> +   This function returns an rtx containing the register,
> +   where the ADDR is stored.  */
> +
> +static rtx
> +do_load_from_addr (machine_mode mode, rtx dest, rtx addr_reg, rtx addr)
> +{
> +  rtx mem = gen_rtx_MEM (mode, addr_reg);
> +  MEM_COPY_ATTRIBUTES (mem, addr);
> +  set_mem_size (mem, GET_MODE_SIZE (mode));
> +
> +  if (mode == QImode)
> +    do_zero_extendqi2 (dest, mem);
> +  else if (mode == Xmode)
> +    emit_move_insn (dest, mem);
> +  else
> +    gcc_unreachable ();
> +
> +  return addr_reg;
> +}
> +
> +/* If the provided string is aligned, then read XLEN bytes
> +   in a loop and use orc.b to find NUL-bytes.  */
> +
> +static bool
> +riscv_expand_strlen_scalar (rtx result, rtx src, rtx align)
> +{
> +  rtx testval, addr, addr_plus_regsz, word, zeros;
> +  rtx loop_label, cond;
> +
> +  gcc_assert (TARGET_ZBB || TARGET_XTHEADBB);
> +
> +  /* The alignment needs to be known and big enough.  */
> +  if (!CONST_INT_P (align) || UINTVAL (align) < GET_MODE_SIZE (Xmode))
> +    return false;
> +
> +  testval = gen_reg_rtx (Xmode);
> +  addr = copy_addr_to_reg (XEXP (src, 0));
> +  addr_plus_regsz = gen_reg_rtx (Pmode);
> +  word = gen_reg_rtx (Xmode);
> +  zeros = gen_reg_rtx (Xmode);
> +
> +  if (TARGET_ZBB)
> +    emit_insn (gen_rtx_SET (testval, constm1_rtx));
> +  else
> +    emit_insn (gen_rtx_SET (testval, const0_rtx));
> +
> +  do_add3 (addr_plus_regsz, addr, GEN_INT (UNITS_PER_WORD));
> +
> +  loop_label = gen_label_rtx ();
> +  emit_label (loop_label);
> +
> +  /* Load a word and use orc.b/th.tstnbz to find a zero-byte.  */
> +  do_load_from_addr (Xmode, word, addr, src);
> +  do_add3 (addr, addr, GEN_INT (UNITS_PER_WORD));
> +  if (TARGET_ZBB)
> +    do_orcb2 (word, word);
> +  else
> +    do_th_tstnbz2 (word, word);
> +  cond = gen_rtx_EQ (VOIDmode, word, testval);
> +  emit_unlikely_jump_insn (gen_cbranch4 (Xmode, cond, word, testval, 
> loop_label));
> +
> +  /* Calculate the return value by counting zero-bits.  */
> +  if (TARGET_ZBB)
> +    do_one_cmpl2 (word, word);
> +  if (TARGET_BIG_ENDIAN)
> +    do_clz2 (zeros, word);
> +  else if (TARGET_ZBB)
> +    do_ctz2 (zeros, word);
> +  else
> +    {
> +      do_th_rev2 (word, word);
> +      do_clz2 (zeros, word);
> +    }
> +
> +  do_lshr3 (zeros, zeros, GEN_INT (exact_log2 (BITS_PER_UNIT)));
> +  do_add3 (addr, addr, zeros);
> +  do_sub3 (result, addr, addr_plus_regsz);
> +
> +  return true;
> +}
> +
> +/* Expand a strlen operation and return true if successful.
> +   Return false if we should let the compiler generate normal
> +   code, probably a strlen call.  */
> +
> +bool
> +riscv_expand_strlen (rtx result, rtx src, rtx search_char, rtx align)
> +{
> +  gcc_assert (search_char == const0_rtx);
> +
> +  if (TARGET_ZBB || TARGET_XTHEADBB)
> +    return riscv_expand_strlen_scalar (result, src, align);
> +
> +  return false;
> +}
> diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md
> index 9da2a9f1c42..e078ebc43cb 100644
> --- a/gcc/config/riscv/riscv.md
> +++ b/gcc/config/riscv/riscv.md
> @@ -82,6 +82,9 @@ (define_c_enum "unspec" [
>
>    ;; the calling convention of callee
>    UNSPEC_CALLEE_CC
> +
> +  ;; String unspecs
> +  UNSPEC_STRLEN
>  ])
>
>  (define_c_enum "unspecv" [
> @@ -3500,6 +3503,31 @@ (define_expand "msubhisi4"
>    "TARGET_XTHEADMAC"
>  )
>
> +;; Search character in string (generalization of strlen).
> +;; Argument 0 is the resulting offset
> +;; Argument 1 is the string
> +;; Argument 2 is the search character
> +;; Argument 3 is the alignment
> +
> +(define_expand "strlen<mode>"
> +  [(set (match_operand:X 0 "register_operand")
> +       (unspec:X [(match_operand:BLK 1 "general_operand")
> +                    (match_operand:SI 2 "const_int_operand")
> +                    (match_operand:SI 3 "const_int_operand")]
> +                 UNSPEC_STRLEN))]
> +  "riscv_inline_strlen && !optimize_size && (TARGET_ZBB || TARGET_XTHEADBB)"
> +{
> +  rtx search_char = operands[2];
> +
> +  if (search_char != const0_rtx)
> +    FAIL;
> +
> +  if (riscv_expand_strlen (operands[0], operands[1], operands[2], 
> operands[3]))
> +    DONE;
> +  else
> +    FAIL;
> +})
> +
>  (include "bitmanip.md")
>  (include "crypto.md")
>  (include "sync.md")
> diff --git a/gcc/config/riscv/riscv.opt b/gcc/config/riscv/riscv.opt
> index 98f342348b7..2491b335aef 100644
> --- a/gcc/config/riscv/riscv.opt
> +++ b/gcc/config/riscv/riscv.opt
> @@ -278,6 +278,10 @@ minline-atomics
>  Target Var(TARGET_INLINE_SUBWORD_ATOMIC) Init(1)
>  Always inline subword atomic operations.
>
> +minline-strlen
> +Target Bool Var(riscv_inline_strlen) Init(0)
> +Inline strlen calls if possible.
> +
>  Enum
>  Name(riscv_autovec_preference) Type(enum riscv_autovec_preference_enum)
>  Valid arguments to -param=riscv-autovec-preference=:
> diff --git a/gcc/config/riscv/t-riscv b/gcc/config/riscv/t-riscv
> index b1f80d1d87c..c012ac0cf33 100644
> --- a/gcc/config/riscv/t-riscv
> +++ b/gcc/config/riscv/t-riscv
> @@ -91,6 +91,12 @@ riscv-selftests.o: 
> $(srcdir)/config/riscv/riscv-selftests.cc \
>         $(COMPILE) $<
>         $(POSTCOMPILE)
>
> +riscv-string.o: $(srcdir)/config/riscv/riscv-string.cc \
> +  $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TARGET_H) backend.h $(RTL_H) \
> +  memmodel.h $(EMIT_RTL_H) poly-int.h output.h
> +       $(COMPILE) $<
> +       $(POSTCOMPILE)
> +
>  riscv-v.o: $(srcdir)/config/riscv/riscv-v.cc \
>    $(CONFIG_H) $(SYSTEM_H) coretypes.h $(TM_H) $(TREE_H) $(RTL_H) \
>    $(TM_P_H) $(TARGET_H) memmodel.h insn-codes.h $(OPTABS_H) $(RECOG_H) \
> diff --git a/gcc/config/riscv/thead.md b/gcc/config/riscv/thead.md
> index 29f98dec3a8..982b048cb65 100644
> --- a/gcc/config/riscv/thead.md
> +++ b/gcc/config/riscv/thead.md
> @@ -110,7 +110,7 @@ (define_insn "*th_clz<mode>2"
>    [(set_attr "type" "bitmanip")
>     (set_attr "mode" "<X:MODE>")])
>
> -(define_insn "*th_rev<mode>2"
> +(define_insn "th_rev<mode>2"
>    [(set (match_operand:GPR 0 "register_operand" "=r")
>         (bswap:GPR (match_operand:GPR 1 "register_operand" "r")))]
>    "TARGET_XTHEADBB && (TARGET_64BIT || <MODE>mode == SImode)"
> @@ -121,6 +121,13 @@ (define_insn "*th_rev<mode>2"
>    [(set_attr "type" "bitmanip")
>     (set_attr "mode" "<GPR:MODE>")])
>
> +(define_insn "th_tstnbz<mode>2"
> +  [(set (match_operand:X 0 "register_operand" "=r")
> +       (unspec:X [(match_operand:X 1 "register_operand" "r")] UNSPEC_ORC_B))]
> +  "TARGET_XTHEADBB"
> +  "th.tstnbz\t%0,%1"
> +  [(set_attr "type" "bitmanip")])
> +
>  ;; XTheadBs
>
>  (define_insn "*th_tst<mode>3"
> diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
> index 33befee7d6b..4a9e385d009 100644
> --- a/gcc/doc/invoke.texi
> +++ b/gcc/doc/invoke.texi
> @@ -1236,7 +1236,8 @@ See RS/6000 and PowerPC Options.
>  -mstack-protector-guard=@var{guard}  -mstack-protector-guard-reg=@var{reg}
>  -mstack-protector-guard-offset=@var{offset}
>  -mcsr-check -mno-csr-check
> --minline-atomics  -mno-inline-atomics}
> +-minline-atomics  -mno-inline-atomics
> +-minline-strlen  -mno-inline-strlen}
>
>  @emph{RL78 Options}
>  @gccoptlist{-msim  -mmul=none  -mmul=g13  -mmul=g14  -mallregs
> @@ -29359,6 +29360,14 @@ Do or don't use smaller but slower subword atomic 
> emulation code that uses
>  libatomic function calls.  The default is to use fast inline subword atomics
>  that do not require libatomic.
>
> +@opindex minline-strlen
> +@item -minline-strlen
> +@itemx -mno-inline-strlen
> +Do or do not attempt to inline strlen calls if possible.
> +Inlining will only be done if the string is properly aligned
> +and instructions for accelerated processing are available.
> +The default is to not inline strlen calls.
> +
>  @opindex mshorten-memrefs
>  @item -mshorten-memrefs
>  @itemx -mno-shorten-memrefs
> diff --git a/gcc/emit-rtl.cc b/gcc/emit-rtl.cc
> index f6276a2d0b6..8bd623dcd0e 100644
> --- a/gcc/emit-rtl.cc
> +++ b/gcc/emit-rtl.cc
> @@ -5168,6 +5168,30 @@ emit_jump_insn (rtx x)
>    return last;
>  }
>
> +/* Make an insn of code JUMP_INSN with pattern X,
> +   add a REG_BR_PROB note that indicates very likely probability,
> +   and add it to the end of the doubly-linked list.  */
> +
> +rtx_insn *
> +emit_likely_jump_insn (rtx x)
> +{
> +  rtx_insn *jump = emit_jump_insn (x);
> +  add_reg_br_prob_note (jump, profile_probability::very_likely ());
> +  return jump;
> +}
> +
> +/* Make an insn of code JUMP_INSN with pattern X,
> +   add a REG_BR_PROB note that indicates very unlikely probability,
> +   and add it to the end of the doubly-linked list.  */
> +
> +rtx_insn *
> +emit_unlikely_jump_insn (rtx x)
> +{
> +  rtx_insn *jump = emit_jump_insn (x);
> +  add_reg_br_prob_note (jump, profile_probability::very_unlikely ());
> +  return jump;
> +}
> +
>  /* Make an insn of code CALL_INSN with pattern X
>     and add it to the end of the doubly-linked list.  */
>
> diff --git a/gcc/rtl.h b/gcc/rtl.h
> index 0e9491b89b4..102ad9b57a6 100644
> --- a/gcc/rtl.h
> +++ b/gcc/rtl.h
> @@ -3347,6 +3347,8 @@ extern rtx_note *emit_note_after (enum insn_note, 
> rtx_insn *);
>  extern rtx_insn *emit_insn (rtx);
>  extern rtx_insn *emit_debug_insn (rtx);
>  extern rtx_insn *emit_jump_insn (rtx);
> +extern rtx_insn *emit_likely_jump_insn (rtx);
> +extern rtx_insn *emit_unlikely_jump_insn (rtx);
>  extern rtx_insn *emit_call_insn (rtx);
>  extern rtx_code_label *emit_label (rtx);
>  extern rtx_jump_table_data *emit_jump_table_data (rtx);
> diff --git a/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen-unaligned.c 
> b/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen-unaligned.c
> new file mode 100644
> index 00000000000..57a6b5ea66a
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen-unaligned.c
> @@ -0,0 +1,14 @@
> +/* { dg-do compile } */
> +/* { dg-options "-minline-strlen -march=rv32gc_xtheadbb" { target { rv32 } } 
> } */
> +/* { dg-options "-minline-strlen -march=rv64gc_xtheadbb" { target { rv64 } } 
> } */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler-not "th.tstnbz\t" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen.c 
> b/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen.c
> new file mode 100644
> index 00000000000..dbc8d1e7da7
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/xtheadbb-strlen.c
> @@ -0,0 +1,19 @@
> +/* { dg-do compile } */
> +/* { dg-options "-minline-strlen -march=rv32gc_xtheadbb" { target { rv32 } } 
> } */
> +/* { dg-options "-minline-strlen -march=rv64gc_xtheadbb" { target { rv64 } } 
> } */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  s = __builtin_assume_aligned (s, 4096);
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler "th.tstnbz\t" } } */
> +/* { dg-final { scan-assembler-not "jalr" } } */
> +/* { dg-final { scan-assembler-not "call" } } */
> +/* { dg-final { scan-assembler-not "jr" } } */
> +/* { dg-final { scan-assembler-not "tail" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled-2.c 
> b/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled-2.c
> new file mode 100644
> index 00000000000..a481068aa0c
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled-2.c
> @@ -0,0 +1,15 @@
> +/* { dg-do compile } */
> +/* { dg-options "-march=rv32gc_zbb" { target { rv32 } } } */
> +/* { dg-options "-march=rv64gc_zbb" { target { rv64 } } } */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  s = __builtin_assume_aligned (s, 4096);
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler-not "orc.b\t" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled.c 
> b/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled.c
> new file mode 100644
> index 00000000000..1295aeb0086
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/zbb-strlen-disabled.c
> @@ -0,0 +1,15 @@
> +/* { dg-do compile } */
> +/* { dg-options "-mno-inline-strlen -march=rv32gc_zbb" { target { rv32 } } } 
> */
> +/* { dg-options "-mno-inline-strlen -march=rv64gc_zbb" { target { rv64 } } } 
> */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  s = __builtin_assume_aligned (s, 4096);
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler-not "orc.b\t" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/zbb-strlen-unaligned.c 
> b/gcc/testsuite/gcc.target/riscv/zbb-strlen-unaligned.c
> new file mode 100644
> index 00000000000..326fef885d8
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/zbb-strlen-unaligned.c
> @@ -0,0 +1,14 @@
> +/* { dg-do compile } */
> +/* { dg-options "-minline-strlen -march=rv32gc_zbb" { target { rv32 } } } */
> +/* { dg-options "-minline-strlen -march=rv64gc_zbb" { target { rv64 } } } */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler-not "orc.b\t" } } */
> diff --git a/gcc/testsuite/gcc.target/riscv/zbb-strlen.c 
> b/gcc/testsuite/gcc.target/riscv/zbb-strlen.c
> new file mode 100644
> index 00000000000..19ebfaef16f
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/zbb-strlen.c
> @@ -0,0 +1,19 @@
> +/* { dg-do compile } */
> +/* { dg-options "-minline-strlen -march=rv32gc_zbb" { target { rv32 } } } */
> +/* { dg-options "-minline-strlen -march=rv64gc_zbb" { target { rv64 } } } */
> +/* { dg-skip-if "" { *-*-* } { "-O0" "-Os" "-Og" "-Oz" } } */
> +
> +typedef long unsigned int size_t;
> +
> +size_t
> +my_str_len (const char *s)
> +{
> +  s = __builtin_assume_aligned (s, 4096);
> +  return __builtin_strlen (s);
> +}
> +
> +/* { dg-final { scan-assembler "orc.b\t" } } */
> +/* { dg-final { scan-assembler-not "jalr" } } */
> +/* { dg-final { scan-assembler-not "call" } } */
> +/* { dg-final { scan-assembler-not "jr" } } */
> +/* { dg-final { scan-assembler-not "tail" } } */
> --
> 2.41.0
>

Reply via email to