688903eb3e
* All files with FSF copyright notices: Update copyright dates using scripts/update-copyrights. * locale/programs/charmap-kw.h: Regenerated. * locale/programs/locfile-kw.h: Likewise.
85 lines
3.3 KiB
C
85 lines
3.3 KiB
C
/* Copyright (C) 2011-2018 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
Contributed by Chris Metcalf <cmetcalf@tilera.com>, 2011.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library. If not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include <endian.h>
|
|
#include <stdint.h>
|
|
|
|
/* Provide a set of macros to help keep endianness #ifdefs out of
|
|
the string functions.
|
|
|
|
MASK: Provide a mask based on the pointer alignment that
|
|
sets up non-zero bytes before the beginning of the string.
|
|
The MASK expression works because shift counts are taken mod 64.
|
|
|
|
NULMASK: Clear bytes beyond a given point in the string.
|
|
|
|
CFZ: Find the first zero bit in the 8 string bytes in a long.
|
|
|
|
REVCZ: Find the last zero bit in the 8 string bytes in a long.
|
|
|
|
STRSHIFT: Shift N bits towards the start of the string. */
|
|
|
|
#if __BYTE_ORDER == __LITTLE_ENDIAN
|
|
#define MASK(x) (__insn_shl(1ULL, (x << 3)) - 1)
|
|
#define NULMASK(x) ((2ULL << x) - 1)
|
|
#define CFZ(x) __insn_ctz(x)
|
|
#define REVCZ(x) __insn_clz(x)
|
|
#define STRSHIFT(x,n) ((x) >> n)
|
|
#else
|
|
#define MASK(x) (__insn_shl(-2LL, ((-x << 3) - 1)))
|
|
#define NULMASK(x) (-2LL << (63 - x))
|
|
#define CFZ(x) __insn_clz(x)
|
|
#define REVCZ(x) __insn_ctz(x)
|
|
#define STRSHIFT(x,n) ((x) << n)
|
|
#endif
|
|
|
|
/* Create eight copies of the byte in a uint64_t. Byte Shuffle uses
|
|
the bytes of srcB as the index into the dest vector to select a
|
|
byte. With all indices of zero, the first byte is copied into all
|
|
the other bytes. */
|
|
static inline uint64_t copy_byte(uint8_t byte)
|
|
{
|
|
return __insn_shufflebytes(byte, 0, 0);
|
|
}
|
|
|
|
/* Implement the byte vector instructions using extended assembly.
|
|
The __insn_OP() builtins are buggy in the upstream compiler;
|
|
see gcc bugzilla 78117. */
|
|
|
|
#define VECOP(OP) \
|
|
static inline uint64_t OP (uint64_t a, uint64_t b) \
|
|
{ \
|
|
uint64_t result; \
|
|
asm volatile (#OP " %0, %1, %2" : "=r"(result) : "r"(a), "r"(b)); \
|
|
return result; \
|
|
} \
|
|
\
|
|
static inline uint64_t OP ## i (uint64_t a, uint64_t b) \
|
|
{ \
|
|
uint64_t result; \
|
|
asm volatile (#OP "i %0, %1, %2" : "=r"(result) : "r"(a), "I"(b)); \
|
|
return result; \
|
|
}
|
|
|
|
VECOP(v1cmpeq)
|
|
VECOP(v1cmpltu)
|
|
VECOP(v1cmpne)
|
|
VECOP(v1add)
|
|
VECOP(v1shru)
|
|
VECOP(v1shl)
|