mirror of
https://github.com/VectorCamp/vectorscan.git
synced 2025-06-28 16:41:01 +03:00
149 lines
5.5 KiB
C++
149 lines
5.5 KiB
C++
#include "nfa/shufti.h"
|
|
#include "nfa/shufticompile.h"
|
|
#include "benchmarks.hpp"
|
|
#include <iostream>
|
|
#include <chrono>
|
|
#include <cstring>
|
|
#include <ctime>
|
|
#include <cstdlib>
|
|
|
|
/*
|
|
#define RST "\x1B[0m"
|
|
#define KRED "\x1B[31m"
|
|
#define KGRN "\x1B[32m"
|
|
#define KYEL "\x1B[33m"
|
|
#define KBLU "\x1B[34m"
|
|
#define KMAG "\x1B[35m"
|
|
#define KCYN "\x1B[36m"
|
|
#define KWHT "\x1B[37m"
|
|
*/
|
|
|
|
|
|
void shufti_benchmarks(int size, int loops, int M, bool has_match) {
|
|
size_t real_size = size;
|
|
m128 lo, hi;
|
|
ue2::CharReach chars;
|
|
chars.set('a');
|
|
int ret = shuftiBuildMasks(chars, (u8 *)&lo, (u8 *)&hi);
|
|
u8 *kt1 = new u8[size];
|
|
memset(kt1,'b',size);
|
|
long double total_sec = 0;
|
|
long double trans_size = 0;
|
|
long double bw = 0;
|
|
if (has_match){
|
|
int pos = 0;
|
|
for(int j=0; j<M; j++){
|
|
kt1[pos] = 'b';
|
|
srand (time(NULL));
|
|
pos = rand() % size + 0;
|
|
kt1[pos] = 'a';
|
|
unsigned long act_size = 0;
|
|
auto start = std::chrono::steady_clock::now();
|
|
for (int i = 0; i < loops; i++) {
|
|
const u8 *res = shuftiExec(lo, hi, kt1, kt1 + size);
|
|
act_size += res - kt1;
|
|
}
|
|
auto end = std::chrono::steady_clock::now();
|
|
long double dt = std::chrono::duration_cast<std::chrono::seconds>(end - start).count();
|
|
total_sec += dt;
|
|
/*calculate transferred size*/
|
|
trans_size += act_size * loops;
|
|
/*calculate bandwidth*/
|
|
bw += trans_size / total_sec;
|
|
/*convert to MB/s*/
|
|
bw += bw / 1048576;
|
|
/*calculte average time*/
|
|
total_sec /= loops;
|
|
}
|
|
total_sec /= M;
|
|
bw /= M;
|
|
/*covert average time to μs*/
|
|
long double ms = total_sec * 1000000;
|
|
std::cout << "\x1B[35m Case with match in random pos and size: " << real_size << " for " << loops<<" loops ("
|
|
<< M << " random possisions checked): \x1B[36m shuftiExec elapsetime: \x1B[0m" << (ms/M)
|
|
<<" (μs) \x1B[36m bandwidth: \x1B[0m" << bw <<" (MB/s)"<<std::endl;
|
|
} else {
|
|
auto start = std::chrono::steady_clock::now();
|
|
for (int i = 0; i < loops; i++) {
|
|
shuftiExec(lo, hi, kt1, kt1 + size);
|
|
}
|
|
auto end = std::chrono::steady_clock::now();
|
|
total_sec += std::chrono::duration_cast<std::chrono::seconds>(end - start).count();
|
|
/*calculate transferred size*/
|
|
trans_size = size * loops ;
|
|
/*calculate bandwidth*/
|
|
bw = trans_size / total_sec;
|
|
/*convert to MB/s*/
|
|
bw /=1048576;
|
|
/*covert average time to μs*/
|
|
long double ms = total_sec * 1000000;
|
|
std::cout<<"\x1B[35m Case with no match in random pos and size: "<<real_size<<" for "<<loops<<" loops:"
|
|
<<"\x1B[36m shuftiExec elapsetime: \x1B[0m"<<(ms/loops)<<" (μs) \x1B[36m bandwidth: \x1B[0m"<< bw <<" (MB/s)"<<std::endl;
|
|
}
|
|
delete [] kt1;
|
|
}
|
|
|
|
void rshufti_benchmarks(int size, int loops, int M, bool has_match) {
|
|
size_t real_size = size;
|
|
m128 lo, hi;
|
|
ue2::CharReach chars;
|
|
chars.set('a');
|
|
int ret = shuftiBuildMasks(chars, (u8 *)&lo, (u8 *)&hi);
|
|
u8 *kt1 = new u8[size];
|
|
memset(kt1,'b',size);
|
|
long double total_sec = 0;
|
|
long double trans_size = 0;
|
|
long double bw = 0;
|
|
if (has_match){
|
|
int pos = 0;
|
|
for(int j=0; j<M; j++){
|
|
kt1[pos] = 'b';
|
|
srand (time(NULL));
|
|
pos = rand() % size + 0;
|
|
kt1[pos] = 'a';
|
|
unsigned long act_size = 0;
|
|
auto start = std::chrono::steady_clock::now();
|
|
for (int i = 0; i < loops; i++) {
|
|
const u8 *res = rshuftiExec(lo, hi, kt1, kt1 + size);
|
|
act_size += res - kt1;
|
|
}
|
|
auto end = std::chrono::steady_clock::now();
|
|
long double dt = std::chrono::duration_cast<std::chrono::seconds>(end - start).count();
|
|
total_sec += dt;
|
|
/*calculate transferred size*/
|
|
trans_size += act_size * loops;
|
|
/*calculate bandwidth*/
|
|
bw += trans_size / total_sec;
|
|
/*convert to MB/s*/
|
|
bw += bw / 1048576;
|
|
/*calculte average time*/
|
|
total_sec /= loops;
|
|
}
|
|
total_sec /= M;
|
|
bw /= M;
|
|
/*covert average time to μs*/
|
|
long double ms = total_sec * 1000000;
|
|
std::cout << "\x1B[35m Case with match in random pos and size: " << real_size << " for " << loops<<" loops ("
|
|
<< M << " random possisions checked): \x1B[36m rshuftiExec elapsetime: \x1B[0m" << (ms/M)
|
|
<<" (μs) \x1B[36m bandwidth: \x1B[0m" << bw <<" (MB/s)"<<std::endl;
|
|
} else {
|
|
auto start = std::chrono::steady_clock::now();
|
|
for (int i = 0; i < loops; i++) {
|
|
rshuftiExec(lo, hi, kt1, kt1 + size);
|
|
}
|
|
auto end = std::chrono::steady_clock::now();
|
|
total_sec += std::chrono::duration_cast<std::chrono::seconds>(end - start).count();
|
|
/*calculate transferred size*/
|
|
trans_size = size * loops ;
|
|
/*calculate bandwidth*/
|
|
bw = trans_size / total_sec;
|
|
/*convert to MB/s*/
|
|
bw /=1048576;
|
|
/*covert average time to μs*/
|
|
long double ms = total_sec * 1000000;
|
|
std::cout<<"\x1B[35m Case with no match in random pos and size: "<<real_size<<" for "<<loops<<" loops:"
|
|
<<"\x1B[36m rshuftiExec elapsetime: \x1B[0m"<<(ms/loops)<<" (μs) \x1B[36m bandwidth: \x1B[0m"<< bw <<" (MB/s)"<<std::endl;
|
|
}
|
|
delete [] kt1;
|
|
}
|