mirror of
https://github.com/VectorCamp/vectorscan.git
synced 2025-09-30 03:34:25 +03:00
Move SVE functions into their own files.
Change-Id: I995ba4b7d2b558ee403693ee45d747d414d3b177
This commit is contained in:
committed by
Konstantinos Margaritis
parent
6c6aee9682
commit
a879715953
@@ -46,6 +46,10 @@
|
||||
#include "util/partial_store.h"
|
||||
#include "ue2common.h"
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
#include "castle_sve.h"
|
||||
#endif
|
||||
|
||||
static really_inline
|
||||
const struct SubCastle *getSubCastle(const struct Castle *c, u32 num) {
|
||||
assert(num < c->numRepeats);
|
||||
@@ -553,42 +557,6 @@ char castleScanNVerm(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
return 1;
|
||||
}
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char castleScanVerm16(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
const size_t end, size_t *loc) {
|
||||
const u8 *ptr = vermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char castleScanNVerm16(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
const size_t end, size_t *loc) {
|
||||
const u8 *ptr = nvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char castleScanShufti(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
const size_t end, size_t *loc) {
|
||||
@@ -690,42 +658,6 @@ char castleRevScanNVerm(const struct Castle *c, const u8 *buf,
|
||||
return 1;
|
||||
}
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char castleRevScanVerm16(const struct Castle *c, const u8 *buf,
|
||||
const size_t begin, const size_t end, size_t *loc) {
|
||||
const u8 *ptr = rvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char castleRevScanNVerm16(const struct Castle *c, const u8 *buf,
|
||||
const size_t begin, const size_t end, size_t *loc) {
|
||||
const u8 *ptr = rnvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char castleRevScanShufti(const struct Castle *c, const u8 *buf,
|
||||
const size_t begin, const size_t end, size_t *loc) {
|
||||
|
96
src/nfa/castle_sve.h
Normal file
96
src/nfa/castle_sve.h
Normal file
@@ -0,0 +1,96 @@
|
||||
/*
|
||||
* Copyright (c) 2015-2016, Intel Corporation
|
||||
* Copyright (c) 2021, Arm Limited
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions are met:
|
||||
*
|
||||
* * Redistributions of source code must retain the above copyright notice,
|
||||
* this list of conditions and the following disclaimer.
|
||||
* * Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in the
|
||||
* documentation and/or other materials provided with the distribution.
|
||||
* * Neither the name of Intel Corporation nor the names of its contributors
|
||||
* may be used to endorse or promote products derived from this software
|
||||
* without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
||||
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
||||
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
||||
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
||||
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
||||
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
||||
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||||
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*/
|
||||
|
||||
/** \file
|
||||
* \brief Castle for SVE: multi-tenant repeat engine, runtime code.
|
||||
*/
|
||||
|
||||
static really_inline
|
||||
char castleScanVerm16(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
const size_t end, size_t *loc) {
|
||||
const u8 *ptr = vermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char castleScanNVerm16(const struct Castle *c, const u8 *buf, const size_t begin,
|
||||
const size_t end, size_t *loc) {
|
||||
const u8 *ptr = nvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char castleRevScanVerm16(const struct Castle *c, const u8 *buf,
|
||||
const size_t begin, const size_t end, size_t *loc) {
|
||||
const u8 *ptr = rvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char castleRevScanNVerm16(const struct Castle *c, const u8 *buf,
|
||||
const size_t begin, const size_t end, size_t *loc) {
|
||||
const u8 *ptr = rnvermicelli16Exec(c->u.verm16.mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
assert(ptr >= buf && ptr < buf + end);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
114
src/nfa/lbr.c
114
src/nfa/lbr.c
@@ -362,56 +362,6 @@ char lbrRevScanNVerm(const struct NFA *nfa, const u8 *buf,
|
||||
return 1;
|
||||
}
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char lbrRevScanVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_VERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = rvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char lbrRevScanNVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_NVERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = rnvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char lbrRevScanShuf(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end,
|
||||
@@ -518,56 +468,6 @@ char lbrFwdScanNVerm(const struct NFA *nfa, const u8 *buf,
|
||||
return 1;
|
||||
}
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char lbrFwdScanVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_VERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = vermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char lbrFwdScanNVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_NVERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = nvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
static really_inline
|
||||
char lbrFwdScanShuf(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end,
|
||||
@@ -625,18 +525,12 @@ char lbrFwdScanTruf(const struct NFA *nfa, const u8 *buf,
|
||||
#define ENGINE_ROOT_NAME NVerm
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
|
||||
#define ENGINE_ROOT_NAME Verm16
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#define ENGINE_ROOT_NAME NVerm16
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
#define ENGINE_ROOT_NAME Shuf
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#define ENGINE_ROOT_NAME Truf
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
#include "lbr_sve.h"
|
||||
#endif
|
130
src/nfa/lbr_sve.h
Normal file
130
src/nfa/lbr_sve.h
Normal file
@@ -0,0 +1,130 @@
|
||||
/*
|
||||
* Copyright (c) 2015-2017, Intel Corporation
|
||||
* Copyright (c) 2021, Arm Limited
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions are met:
|
||||
*
|
||||
* * Redistributions of source code must retain the above copyright notice,
|
||||
* this list of conditions and the following disclaimer.
|
||||
* * Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in the
|
||||
* documentation and/or other materials provided with the distribution.
|
||||
* * Neither the name of Intel Corporation nor the names of its contributors
|
||||
* may be used to endorse or promote products derived from this software
|
||||
* without specific prior written permission.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
||||
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
||||
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
||||
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
||||
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
||||
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
||||
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||||
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
* POSSIBILITY OF SUCH DAMAGE.
|
||||
*/
|
||||
|
||||
/** \file
|
||||
* \brief Large Bounded Repeat (LBR) engine for SVE: runtime code.
|
||||
*/
|
||||
|
||||
static really_inline
|
||||
char lbrRevScanVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_VERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = rvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char lbrRevScanNVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_NVERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = rnvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + begin - 1) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char lbrFwdScanVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_VERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = vermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
static really_inline
|
||||
char lbrFwdScanNVerm16(const struct NFA *nfa, const u8 *buf,
|
||||
size_t begin, size_t end, size_t *loc) {
|
||||
assert(begin <= end);
|
||||
assert(nfa->type == LBR_NFA_NVERM16);
|
||||
const struct lbr_verm16 *l = getImplNfa(nfa);
|
||||
|
||||
if (begin == end) {
|
||||
return 0;
|
||||
}
|
||||
|
||||
const u8 *ptr = nvermicelli16Exec(l->mask, buf + begin, buf + end);
|
||||
if (ptr == buf + end) {
|
||||
DEBUG_PRINTF("no escape found\n");
|
||||
return 0;
|
||||
}
|
||||
|
||||
assert(loc);
|
||||
*loc = ptr - buf;
|
||||
DEBUG_PRINTF("escape found at offset %zu\n", *loc);
|
||||
return 1;
|
||||
}
|
||||
|
||||
#define ENGINE_ROOT_NAME Verm16
|
||||
#include "lbr_common_impl.h"
|
||||
|
||||
#define ENGINE_ROOT_NAME NVerm16
|
||||
#include "lbr_common_impl.h"
|
@@ -270,7 +270,7 @@ static really_inline const u8 *shuftiDoubleMini(SuperVector<S> mask1_lo, SuperVe
|
||||
t.print8("t");
|
||||
|
||||
typename SuperVector<S>::movemask_type z = t.eqmask(SuperVector<S>::Ones());
|
||||
DEBUG_PRINTF(" z: 0x%08x\n", z);
|
||||
DEBUG_PRINTF(" z: 0x%016llx\n", (u64a)z);
|
||||
return firstMatch<S>(buf, z);
|
||||
}
|
||||
|
||||
|
Reference in New Issue
Block a user