summaryrefslogtreecommitdiffstats
path: root/framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu
diff options
context:
space:
mode:
authorAshlee Young <ashlee@onosfw.com>2015-09-09 22:21:41 -0700
committerAshlee Young <ashlee@onosfw.com>2015-09-09 22:21:41 -0700
commit8879b125d26e8db1a5633de5a9c692eb2d1c4f83 (patch)
treec7259d85a991b83dfa85ab2e339360669fc1f58e /framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu
parent13d05bc8458758ee39cb829098241e89616717ee (diff)
suricata checkin based on commit id a4bce14770beee46a537eda3c3f6e8e8565d5d0a
Change-Id: I9a214fa0ee95e58fc640e50bd604dac7f42db48f
Diffstat (limited to 'framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu')
-rw-r--r--framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu96
1 files changed, 96 insertions, 0 deletions
diff --git a/framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu b/framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu
new file mode 100644
index 00000000..d7cc125b
--- /dev/null
+++ b/framework/src/suricata/src/util-mpm-ac-cuda-kernel.cu
@@ -0,0 +1,96 @@
+/* Copyright (C) 2007-2012 Open Information Security Foundation
+ *
+ * You can copy, redistribute or modify this Program under the terms of
+ * the GNU General Public License version 2 as published by the Free
+ * Software Foundation.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * version 2 along with this program; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
+ * 02110-1301, USA.
+ */
+
+/**
+ * \file
+ *
+ * \author Anoop Saldanha <anoopsaldanha@gmail.com>
+ *
+ * The Cuda kernel for MPM AC.
+ *
+ * \todo - This is a basic version of the kernel.
+ * - Support 16 bit state tables.
+ * - Texture memory.
+ * - Multiple threads per blocks of threads. Make use of
+ * shared memory/texture memory.
+ */
+
+extern "C"
+__global__ void SCACCudaSearch64(unsigned char *d_buffer,
+ unsigned int d_buffer_start_offset,
+ unsigned int *o_buffer,
+ unsigned int *results_buffer,
+ unsigned int nop,
+ unsigned char *tolower)
+{
+ unsigned int u = 0;
+ unsigned int tid = blockIdx.x * blockDim.x + threadIdx.x;
+ if (tid >= nop)
+ return;
+
+ unsigned int buflen = *((unsigned long *)(d_buffer + (o_buffer[tid] - d_buffer_start_offset)));
+ unsigned int (*state_table_u32)[256] =
+ (unsigned int (*)[256])*((unsigned long *)(d_buffer + (o_buffer[tid] - d_buffer_start_offset) + 8));
+ unsigned char *buf = (d_buffer + (o_buffer[tid] - d_buffer_start_offset) + 16);
+
+ unsigned int state = 0;
+ unsigned int matches = 0;
+ unsigned int *results = (results_buffer + ((o_buffer[tid] - d_buffer_start_offset) * 2) + 1);
+ for (u = 0; u < buflen; u++) {
+ state = state_table_u32[state & 0x00FFFFFF][tolower[buf[u]]];
+ if (state & 0xFF000000) {
+ results[matches++] = u;
+ results[matches++] = state & 0x00FFFFFF;
+ }
+ }
+
+ *(results - 1) = matches;
+ return;
+}
+
+extern "C"
+__global__ void SCACCudaSearch32(unsigned char *d_buffer,
+ unsigned int d_buffer_start_offset,
+ unsigned int *o_buffer,
+ unsigned int *results_buffer,
+ unsigned int nop,
+ unsigned char *tolower)
+{
+ unsigned int u = 0;
+ unsigned int tid = blockIdx.x * blockDim.x + threadIdx.x;
+ if (tid >= nop)
+ return;
+
+ unsigned int buflen = *((unsigned int *)(d_buffer + (o_buffer[tid] - d_buffer_start_offset)));
+ unsigned int (*state_table_u32)[256] =
+ (unsigned int (*)[256])*((unsigned int *)(d_buffer + (o_buffer[tid] - d_buffer_start_offset) + 4));
+ unsigned char *buf = (d_buffer + (o_buffer[tid] - d_buffer_start_offset) + 8);
+
+ unsigned int state = 0;
+ unsigned int matches = 0;
+ unsigned int *results = (results_buffer + ((o_buffer[tid] - d_buffer_start_offset) * 2) + 1);
+ for (u = 0; u < buflen; u++) {
+ state = state_table_u32[state & 0x00FFFFFF][tolower[buf[u]]];
+ if (state & 0xFF000000) {
+ results[matches++] = u;
+ results[matches++] = state & 0x00FFFFFF;
+ }
+ }
+
+ *(results - 1) = matches;
+ return;
+}