mirror of
https://github.com/VectorCamp/vectorscan.git
synced 2025-11-19 02:30:35 +03:00
Implement new Vermicelli16 acceleration functions using SVE2.
The scheme utilises the MATCH and NMATCH instructions to scan for 16 characters at the same rate as vermicelli scans for one. Change-Id: Ie2cef904c56651e6108593c668e9b65bc001a886
This commit is contained in:
committed by
Konstantinos Margaritis
parent
b6a7ee7e84
commit
b54710d208
@@ -1,5 +1,6 @@
|
||||
/*
|
||||
* Copyright (c) 2015-2017, Intel Corporation
|
||||
* Copyright (c) 2021, Arm Limited
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions are met:
|
||||
@@ -81,6 +82,17 @@ const u8 *run_accel(const union AccelAux *accel, const u8 *c, const u8 *c_end) {
|
||||
c_end - 1);
|
||||
break;
|
||||
|
||||
#ifdef HAVE_SVE2
|
||||
case ACCEL_VERM16:
|
||||
DEBUG_PRINTF("accel verm16 %p %p\n", c, c_end);
|
||||
if (c_end - c < 16) {
|
||||
return c;
|
||||
}
|
||||
|
||||
rv = vermicelli16Exec(accel->verm16.mask, c, c_end);
|
||||
break;
|
||||
#endif // HAVE_SVE2
|
||||
|
||||
case ACCEL_DVERM_MASKED:
|
||||
DEBUG_PRINTF("accel dverm masked %p %p\n", c, c_end);
|
||||
if (c + 16 + 1 >= c_end) {
|
||||
|
||||
Reference in New Issue
Block a user