3
0
mirror of https://github.com/CrazyRedMachine/popnhax.git synced 2025-01-24 15:22:12 +01:00
popnhax/util/search.cc

75 lines
2.1 KiB
C++
Raw Normal View History

2023-07-09 21:34:07 +02:00
#include <memory.h>
#include <stdint.h>
#include <cstdio>
#include "util/log.h"
#define NO_OF_CHARS 256
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
// A utility function to get maximum of two integers
static int max(int a, int b) {
return (a > b) ? a : b;
}
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
// The preprocessing function for Boyer Moore's bad character heuristic
static void badCharHeuristic(const unsigned char *str, int size, int* badchar) {
int i;
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
// Initialize all occurrences as -1
for (i = 0; i < NO_OF_CHARS; i++)
badchar[i] = -1;
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
// Fill the actual value of last occurrence of a character
for (i = 0; i < size; i++)
badchar[(int) str[i]] = i;
}
#define DEBUG_SEARCH 0
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
int _search(unsigned char *haystack, size_t haystack_size, const unsigned char *needle, size_t needle_size, int orig_offset, int debug) {
int badchar[NO_OF_CHARS];
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
badCharHeuristic(needle, needle_size, badchar);
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
int64_t s = 0; // s is shift of the pattern with respect to text
while (s <= (haystack_size - needle_size)) {
int j = needle_size - 1;
if (debug == 2)
{
2023-07-10 21:35:09 +02:00
LOG("--------------------------------\n");
LOG("txt...");
for (size_t i = 0; i < needle_size; i++)
{
LOG("%02x ", haystack[orig_offset+s+i]);
}
LOG("\n");
LOG("pat...");
for (size_t i = 0; i < needle_size; i++)
{
LOG("%02x ", needle[i]);
}
LOG("\n");
2023-07-09 21:34:07 +02:00
}
while (j >= 0 && needle[j] == haystack[orig_offset + s + j])
j--;
2023-07-10 21:35:09 +02:00
2023-07-09 21:34:07 +02:00
if (j < 0) {
2023-07-10 21:35:09 +02:00
if (debug)
LOG("found string at offset %llx!\n", orig_offset +s);
return orig_offset + s;
2023-07-09 21:34:07 +02:00
}
else
2023-07-10 21:35:09 +02:00
{
2023-07-09 21:34:07 +02:00
s += max(1, j - badchar[(int)haystack[orig_offset + s + j]]);
2023-07-10 21:35:09 +02:00
if (debug)
LOG("mismatch at pos %d, new offset %llx\n\n", j, orig_offset+s);
}
2023-07-09 21:34:07 +02:00
}
2023-07-10 21:35:09 +02:00
return -1;
2023-07-09 21:34:07 +02:00
}
int search(char *haystack, size_t haystack_size, const char *needle, size_t needle_size, size_t orig_offset) {
2023-07-10 21:35:09 +02:00
int res = _search((unsigned char*) haystack, haystack_size, (const unsigned char *)needle, needle_size, orig_offset, 0);
return res;
2023-07-09 21:34:07 +02:00
}