xerpi/nidattack.c

## nidattack.c
/*
SHA1 dictionary attack program v2.0 (c) 2005 adresd
based on original by djhuevo

hash searchtable and other mods by adresd
performance checked by gorim

added OpenMP support by xerpi

compile with:
	gcc -march=native -Ofast nidattack.c -o nidattack -fopenmp

No License, public domain, do as you want, no warranties
*/

#include <stdio.h>
#include <string.h>
#include <time.h>
#include <stdlib.h>
#include <stdint.h>

typedef int8_t s8;
typedef int16_t s16;
typedef int32_t s32;
typedef uint8_t u8;
typedef uint16_t u16;
typedef uint32_t u32;

/*
SHA-1 based on Steve Reid SHA1 code <steve@edmweb.com>
*/

// this was originally 64, but since ps3 adds 16 bytes
// to every hash buffer it may need to be increased.
// Note: The '128' size does not currently work -
// would anyone like to fix it? :)
#define MAX_HASH_BUFF		64
//#define MAX_HASH_BUFF		128

#define LITTLE_ENDIAN

#define rol(value, bits) (((value) << (bits)) | ((value) >> (32 - (bits))))

/* blk0() and blk() perform the initial expand. */
/* I got the idea of expanding during the round function from SSLeay */
#ifdef LITTLE_ENDIAN
#define blk0(i) (block[i] = (rol(block[i],24)&0xFF00FF00) \
    |(rol(block[i],8)&0x00FF00FF))
#else
#define blk0(i) block[i]
#endif
#define blk(i) (block[i&15] = rol(block[(i+13)&15]^block[(i+8)&15] \
    ^block[(i+2)&15]^block[i&15],1))

/* (R0+R1), R2, R3, R4 are the different operations used in SHA1 */
#define R0(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk0(i)+0x5A827999+rol(v,5);w=rol(w,30);
#define R1(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk(i)+0x5A827999+rol(v,5);w=rol(w,30);
#define R2(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0x6ED9EBA1+rol(v,5);w=rol(w,30);
#define R3(v,w,x,y,z,i) z+=(((w|x)&y)|(w&x))+blk(i)+0x8F1BBCDC+rol(v,5);w=rol(w,30);
#define R4(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0xCA62C1D6+rol(v,5);w=rol(w,30);

u32 fastSHA1(unsigned char *buffer,int len) {
    u8 buf[MAX_HASH_BUFF];
    s32 i;
    u32 a, b, c, d, e;
    u32 *block;

    memcpy(buf, buffer, len);
    block=(u32 *)buf;

    for(i=len+1; i<MAX_HASH_BUFF-1; i++) {
      buf[i]=0x00;
    }

    buf[len]=0x80;
    buf[MAX_HASH_BUFF-2]=(len*8)>>8;
    buf[MAX_HASH_BUFF-1]=(len*8)&0xff;

    a = 0x67452301;
    b = 0xEFCDAB89;
    c = 0x98BADCFE;
    d = 0x10325476;
    e = 0xC3D2E1F0;

    /* 4 rounds of 20 operations each. Loop unrolled. */
    R0(a,b,c,d,e, 0); R0(e,a,b,c,d, 1); R0(d,e,a,b,c, 2); R0(c,d,e,a,b, 3);
    R0(b,c,d,e,a, 4); R0(a,b,c,d,e, 5); R0(e,a,b,c,d, 6); R0(d,e,a,b,c, 7);
    R0(c,d,e,a,b, 8); R0(b,c,d,e,a, 9); R0(a,b,c,d,e,10); R0(e,a,b,c,d,11);
    R0(d,e,a,b,c,12); R0(c,d,e,a,b,13); R0(b,c,d,e,a,14); R0(a,b,c,d,e,15);
    R1(e,a,b,c,d,16); R1(d,e,a,b,c,17); R1(c,d,e,a,b,18); R1(b,c,d,e,a,19);
    R2(a,b,c,d,e,20); R2(e,a,b,c,d,21); R2(d,e,a,b,c,22); R2(c,d,e,a,b,23);
    R2(b,c,d,e,a,24); R2(a,b,c,d,e,25); R2(e,a,b,c,d,26); R2(d,e,a,b,c,27);
    R2(c,d,e,a,b,28); R2(b,c,d,e,a,29); R2(a,b,c,d,e,30); R2(e,a,b,c,d,31);
    R2(d,e,a,b,c,32); R2(c,d,e,a,b,33); R2(b,c,d,e,a,34); R2(a,b,c,d,e,35);
    R2(e,a,b,c,d,36); R2(d,e,a,b,c,37); R2(c,d,e,a,b,38); R2(b,c,d,e,a,39);
    R3(a,b,c,d,e,40); R3(e,a,b,c,d,41); R3(d,e,a,b,c,42); R3(c,d,e,a,b,43);
    R3(b,c,d,e,a,44); R3(a,b,c,d,e,45); R3(e,a,b,c,d,46); R3(d,e,a,b,c,47);
    R3(c,d,e,a,b,48); R3(b,c,d,e,a,49); R3(a,b,c,d,e,50); R3(e,a,b,c,d,51);
    R3(d,e,a,b,c,52); R3(c,d,e,a,b,53); R3(b,c,d,e,a,54); R3(a,b,c,d,e,55);
    R3(e,a,b,c,d,56); R3(d,e,a,b,c,57); R3(c,d,e,a,b,58); R3(b,c,d,e,a,59);
    R4(a,b,c,d,e,60); R4(e,a,b,c,d,61); R4(d,e,a,b,c,62); R4(c,d,e,a,b,63);
    R4(b,c,d,e,a,64); R4(a,b,c,d,e,65); R4(e,a,b,c,d,66); R4(d,e,a,b,c,67);
    R4(c,d,e,a,b,68); R4(b,c,d,e,a,69); R4(a,b,c,d,e,70); R4(e,a,b,c,d,71);
    R4(d,e,a,b,c,72); R4(c,d,e,a,b,73); R4(b,c,d,e,a,74); R4(a,b,c,d,e,75);
    R4(e,a,b,c,d,76); R4(d,e,a,b,c,77); R4(c,d,e,a,b,78); R4(b,c,d,e,a,79);

    a+=0x67452301;
    return (a>>24)|((a>>8)&0xff00)|((a<<8)&0xff0000)|((a<<24));
}

static inline int64_t difftimespec_ns(const struct timespec after, const struct timespec before)
{
    return ((int64_t)after.tv_sec - (int64_t)before.tv_sec) * (int64_t)1000000000
         + ((int64_t)after.tv_nsec - (int64_t)before.tv_nsec);
}

char **dict;
char *dict_member_length;
int dict_count;
unsigned int *hash;
int hash_count;

int load_hash_list(char *filename)
{
	int i;
	unsigned int t;
	FILE *fp;
	printf("Reading hash file '%s'\n", filename);
	if ((fp = fopen(filename, "rt")) == NULL)
		return -1;
	hash_count = 0;
	while (fscanf(fp, "0x%x\n", &t) == 1)
		hash_count++;
	printf("hash_count = %d\n", hash_count);
	fseek(fp, 0, SEEK_SET);
	hash = malloc(hash_count * sizeof(unsigned int));
	i = 0;
	while (fscanf(fp, "0x%x\n", &hash[i++]) == 1);
	fclose(fp);
	return 0;
}

int load_dictionary(char *filename)
{
	int i;
	char buffer[0x200];
	FILE *fp;
	printf("Reading dictionary file '%s'\n", filename);
	if ((fp = fopen(filename, "rt")) == NULL)
		return -1;
	dict_count = 0;
	while (fscanf(fp, "%s\n", buffer) != EOF)
		dict_count++;
	printf("dict_count = %d\n", dict_count);
	fseek(fp, 0, SEEK_SET);
	dict = (char **) malloc(dict_count * sizeof(char *));
	dict_member_length = malloc(dict_count);
	i = 0;
	while (fscanf(fp, "%s\n", buffer) == 1) {
		if ((buffer[0] == '-') || (buffer[0] == '/')) {	// This handles comments in the dic file
		} else {				// Not a comment, so do duplicate check
			int count;
			int found = 0;
			for (count = 0; count < (i - 1); count++)
				if (strcmp(buffer, dict[count]) == 0)
					found = 1;
			if (found == 0) {	// If not already in dictionary, then add
				dict_member_length[i] = strlen(buffer);
				dict[i] = malloc(dict_member_length[i] + 1);
				strcpy(dict[i], buffer);
				i++;
			}
		}
	}
	dict_count = i;
	fclose(fp);
	return 0;
}

FILE *fout;

// Hash seems to be where the program spends most of its time, so we need to speedup the
// search somehow
// 32 bit value, 4 bytes
// what we do, is pre-sort the hashlist, so they are in order AABBCCDD
// Then index each byte into the list, hence cutting down the search space considerably
#define VER2_SIZE  256
// midsearch should hopefully fit in cache, so will
// help quite a lot with rejection testing.
int midsearch[VER2_SIZE*VER2_SIZE];
// bigsearch is really a cop out, will not fit in cache, but still quicker
// than checking many elements.
int bigsearch[VER2_SIZE*VER2_SIZE*VER2_SIZE];

void fillsearchtable()
{
	unsigned int searchval;
	int hashpos,hashpos2,hashpos3;
	int count,count2,count3;
	// Firstly Sort the hashlist, order AABBCCDD
	int found = 1;
	printf("Sorting Hashlist\n");
	while (found == 1)
	{
		found = 0;
		for (count=0;count<(hash_count-1);count++)
		{
			if (hash[count] > hash[count+1])
			{ //	swap entries if wrong way around
				unsigned int temp = hash[count+1];
				hash[count+1] = hash[count];
				hash[count] = temp;
				found = 1;
			}
		}
	}
	printf("Clearing Search Tree\n");
	// Really lazy slow clear array, but who cares only done once
	for (count=0;count<(VER2_SIZE*VER2_SIZE);count++)
	{
		midsearch[count] = -1;
	}
	for (count=0;count<(VER2_SIZE*VER2_SIZE*VER2_SIZE);count++)
	{
		bigsearch[count] = -1;
	}
	printf("Building Search Tree\n");
	// Now build the toplevel (first) byte
	//#pragma omp parallel for
	for (count=0;count<256;count++)
	{ //	Find the first firstbyte in the hashlist that matches this value
		hashpos = 0;
		searchval = (count<<24);
		while ((hash[hashpos]&0xff000000) < searchval && hashpos < hash_count - 1)
			hashpos++;
		if ((hash[hashpos]&0xff000000) == searchval)
		{
			// Now Search for a twobyte combo
			for (count2=0;count2<256;count2++)
			{ //	Find the first secondbyte in the hashlist from this pos
				hashpos2 = hashpos;
				searchval = (count<<24) | (count2<<16);
				while ((hash[hashpos2]&0xffff0000) < searchval &&
				 hashpos2 < hash_count - 1) hashpos2++;
				if ((hash[hashpos2]&0xffff0000) == searchval)
				{ //	Add this entry
					midsearch[(count<<8)+count2] = hashpos2;

					// Now Search for a threebyte combo
					for (count3=0;count3<256;count3++)
					{ //	Find the first thirdbyte in the hashlist from this pos
						hashpos3 = hashpos2;
						searchval = (count<<24) | (count2<<16) | (count3<<8);
						while ((hash[hashpos3]&0xffffff00) < searchval &&
			 hashpos3 < hash_count - 1) hashpos3++;
						if ((hash[hashpos3]&0xffffff00) == searchval)
						{ //	Add this entry
							bigsearch[(count<<16)+(count2<<8)+count3] = hashpos2;
						}
					}
				}
			}
		}
	}
}

int findhash(char *buffer, int size, int isPS3)
{
	int h;
	unsigned int hashvalue;
	unsigned int index1;
	unsigned int index2;
	unsigned int index3;
	u8 int_buff[MAX_HASH_BUFF];
	u8* buff_ptr;
	const u8 ps3_key[16] = {
		0x67, 0x59, 0x65, 0x99, 0x04, 0x25, 0x04, 0x90,
		0x56, 0x64, 0x27, 0x49, 0x94, 0x89, 0x74, 0x1A };

	if(isPS3)
	{
		buff_ptr = int_buff;
		memcpy(int_buff, buffer, size);
		memcpy(int_buff+size, ps3_key, 16);
		size += 16;
	}
	else
	{
		buff_ptr = buffer;
	}

	//fastSHA1 doesn't support strings larger than MAX_HASH_BUFF-1 bytes
	//and chances are unlikely that function names are that
	//long anyway so reject them before doing processing
	if (size > MAX_HASH_BUFF-1)
		return 0;
	hashvalue = fastSHA1(buff_ptr, size);
	index1 = (hashvalue & 0xff000000)>>24;
	index2 = (hashvalue & 0x00ff0000)>>16;
	index3 = (hashvalue & 0x0000ff00)>>8;
	int pos;
	//	Not sure if this really helps or not, should do.. on early rejection
	//	memory accesses if nothing else
	pos = midsearch[(index1<<8)+index2];
	if (pos != -1)
	{
		// Get threebyte position
		pos = bigsearch[(index1<<16)+(index2<<8)+index3];
		if (pos != -1)
		{ // Found a position, so search from here
			for(h=pos; h<hash_count; h++)
			{
				if (hashvalue >= hash[h])
					if(hashvalue == hash[h])
					{ //	If equal, found
						#pragma omp critical
						{
							printf("Found : 0x%08x	%s	\n",hashvalue,buffer);
							fprintf(fout,"<FUNC><NID>0x%08x</NID><NAME>%s</NAME></FUNC>\n",hashvalue,buffer);
						}
						return 1;
					}
					else	//	If not, reject as above
						return 0;
			}
		}
	}
	return 0;
}

int main(int argc, char **argv)
{
	char gbuffer[0x200];
	struct timespec start, end;
	int is_ps3_flag = 0;

	char *prefix = "";
	int prefixlen = 0;

	printf("SHA1 hash dictionary attack v2.1 by adresd\n");
	printf("based on the original by djhuevo\n");
	printf("PS3 support added by xorloser\n");

	if (argc < 3) {
		printf("usage:\n\t%s <hash_list> <dictionary> [-ps3] [prefix]\n", argv[0]);
		return 1;
	}

	if (load_hash_list(argv[1]) < 0) {
		fprintf(stderr, "can't open the hash file %s\n", argv[1]);
		return 2;
	}

	if (load_dictionary(argv[2]) < 0) {
		fprintf(stderr, "can't open the dictionary file %s\n", argv[2]);
		return 3;
	}

	if (argc > 3) {
		if( !strcmp("-ps3", argv[3]) ) {
			is_ps3_flag = 1;
			if (argc > 4) {
				prefix = argv[4];
				strcpy(gbuffer, prefix);
				prefixlen = strlen(prefix);
			}
		}
		else
		{
			prefix = argv[3];
			strcpy(gbuffer, prefix);
			prefixlen = strlen(prefix);
		}
	}

	if (hash_count < 1 || dict_count < 1) {
		fprintf(stderr, "error on input data.\n");
		fprintf(stderr, "hash_count = %d, dict_count = %d\n", hash_count, dict_count);
		return 4;
	}

	if ((fout = fopen("results.xml", "wba")) <= 0) {
		printf("Failed to open output file\n");
		exit(1);
	}

	printf("\nprefix : '%s'\n", prefix != "" ? prefix : "<None>");
	printf("hash count : %d\n", hash_count);
	printf("dictionary words: %d\n\n", dict_count);

	fillsearchtable();

	printf("\nsearching...\n\n");
	fflush(stdout);
	clock_gettime(CLOCK_MONOTONIC, &start);

	// First Word
	#pragma omp parallel for
	for (int x = 0; x < dict_count; x++) {
		char buffer[0x200];
		int i; // , j, h;
		int y, z, zz, z2;
		char *ptr, *ptr0, *ptr1, *ptr2, *ptr3, *ptr4;
		strcpy(buffer, gbuffer);
		ptr0 = &buffer[prefixlen];
		for (i = 0; i < dict_member_length[x]; i++) {
			*(ptr0++) = dict[x][i];
		}
		*(ptr0) = 0;
		#pragma omp critical
		printf("// processing word: %s\n", buffer);
		//fflush(stdout);
		// Second word
		for (y = 0; y < dict_count; y++) {
			ptr1 = ptr0;
			for (i = 0; i < dict_member_length[y]; i++) {
				*(ptr1++) = dict[y][i];
			}
			*(ptr1) = 0;
			//printf("// processing word: %s\n",buffer);

			// Only do next loop if first and second dont match
			if (strcmp(dict[x], dict[y]) != 0) {
				// Third Word
				for (z = 0; z < dict_count; z++) {
					ptr2 = ptr1;
					for (i = 0; i < dict_member_length[z]; i++) {
						*(ptr2++) = dict[z][i];
					}
					// Only do next loop if second and third dont match
					if (strcmp(dict[y], dict[z]) != 0) {
						// Fourth Word
						for (zz = 0; zz < dict_count; zz++) {
							ptr3 = ptr2;
							for (i = 0; i < dict_member_length[zz]; i++) {
								*(ptr3++) = dict[zz][i];
							}
							// Only do next loop if third and fourth dont match
							if (strcmp(dict[z], dict[zz]) != 0) {
								// Fifth Word
								for (z2 = 0; z2 < dict_count; z2++) {
									ptr4 = ptr3;
									for (i = 0; i < dict_member_length[z2]; i++) {
										*(ptr4++) = dict[z2][i];
									}
									*(ptr4) = 0x00;
									findhash(buffer, ptr4 - buffer, is_ps3_flag);
								}
							}
							*(ptr3) = 0x00;
							findhash(buffer, ptr3 - buffer, is_ps3_flag);
						}
					}
					*(ptr2) = 0x00;
					findhash(buffer, ptr2 - buffer, is_ps3_flag);
				}
			}
			*(ptr1) = 0x00;
			findhash(buffer, ptr1 - buffer, is_ps3_flag);
		}
		*(ptr0) = 0x00;
		findhash(buffer, ptr0 - buffer, is_ps3_flag);
	}
	clock_gettime(CLOCK_MONOTONIC, &end);
	printf("\n\nhash count : %d\n", hash_count);
	printf("dictionary words: %d\n\n", dict_count);
	printf("\n\ntime : %f seconds.\n", difftimespec_ns(end, start) / 1000000000.0);

	fclose(fout);
	return 0;
}
	/*
	SHA1 dictionary attack program v2.0 (c) 2005 adresd
	based on original by djhuevo

	hash searchtable and other mods by adresd
	performance checked by gorim

	added OpenMP support by xerpi

	compile with:
	gcc -march=native -Ofast nidattack.c -o nidattack -fopenmp

	No License, public domain, do as you want, no warranties
	*/

	#include <stdio.h>
	#include <string.h>
	#include <time.h>
	#include <stdlib.h>
	#include <stdint.h>

	typedef int8_t s8;
	typedef int16_t s16;
	typedef int32_t s32;
	typedef uint8_t u8;
	typedef uint16_t u16;
	typedef uint32_t u32;

	/*
	SHA-1 based on Steve Reid SHA1 code <steve@edmweb.com>
	*/

	// this was originally 64, but since ps3 adds 16 bytes
	// to every hash buffer it may need to be increased.
	// Note: The '128' size does not currently work -
	// would anyone like to fix it? :)
	#define MAX_HASH_BUFF 64
	//#define MAX_HASH_BUFF 128

	#define LITTLE_ENDIAN

	#define rol(value, bits) (((value) << (bits)) \| ((value) >> (32 - (bits))))

	/* blk0() and blk() perform the initial expand. */
	/* I got the idea of expanding during the round function from SSLeay */
	#ifdef LITTLE_ENDIAN
	#define blk0(i) (block[i] = (rol(block[i],24)&0xFF00FF00) \
	\|(rol(block[i],8)&0x00FF00FF))
	#else
	#define blk0(i) block[i]
	#endif
	#define blk(i) (block[i&15] = rol(block[(i+13)&15]^block[(i+8)&15] \
	^block[(i+2)&15]^block[i&15],1))

	/* (R0+R1), R2, R3, R4 are the different operations used in SHA1 */
	#define R0(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk0(i)+0x5A827999+rol(v,5);w=rol(w,30);
	#define R1(v,w,x,y,z,i) z+=((w&(x^y))^y)+blk(i)+0x5A827999+rol(v,5);w=rol(w,30);
	#define R2(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0x6ED9EBA1+rol(v,5);w=rol(w,30);
	#define R3(v,w,x,y,z,i) z+=(((w\|x)&y)\|(w&x))+blk(i)+0x8F1BBCDC+rol(v,5);w=rol(w,30);
	#define R4(v,w,x,y,z,i) z+=(w^x^y)+blk(i)+0xCA62C1D6+rol(v,5);w=rol(w,30);

	u32 fastSHA1(unsigned char *buffer,int len) {
	u8 buf[MAX_HASH_BUFF];
	s32 i;
	u32 a, b, c, d, e;
	u32 *block;

	memcpy(buf, buffer, len);
	block=(u32 *)buf;

	for(i=len+1; i<MAX_HASH_BUFF-1; i++) {
	buf[i]=0x00;
	}

	buf[len]=0x80;
	buf[MAX_HASH_BUFF-2]=(len*8)>>8;
	buf[MAX_HASH_BUFF-1]=(len*8)&0xff;

	a = 0x67452301;
	b = 0xEFCDAB89;
	c = 0x98BADCFE;
	d = 0x10325476;
	e = 0xC3D2E1F0;

	/* 4 rounds of 20 operations each. Loop unrolled. */
	R0(a,b,c,d,e, 0); R0(e,a,b,c,d, 1); R0(d,e,a,b,c, 2); R0(c,d,e,a,b, 3);
	R0(b,c,d,e,a, 4); R0(a,b,c,d,e, 5); R0(e,a,b,c,d, 6); R0(d,e,a,b,c, 7);
	R0(c,d,e,a,b, 8); R0(b,c,d,e,a, 9); R0(a,b,c,d,e,10); R0(e,a,b,c,d,11);
	R0(d,e,a,b,c,12); R0(c,d,e,a,b,13); R0(b,c,d,e,a,14); R0(a,b,c,d,e,15);
	R1(e,a,b,c,d,16); R1(d,e,a,b,c,17); R1(c,d,e,a,b,18); R1(b,c,d,e,a,19);
	R2(a,b,c,d,e,20); R2(e,a,b,c,d,21); R2(d,e,a,b,c,22); R2(c,d,e,a,b,23);
	R2(b,c,d,e,a,24); R2(a,b,c,d,e,25); R2(e,a,b,c,d,26); R2(d,e,a,b,c,27);
	R2(c,d,e,a,b,28); R2(b,c,d,e,a,29); R2(a,b,c,d,e,30); R2(e,a,b,c,d,31);
	R2(d,e,a,b,c,32); R2(c,d,e,a,b,33); R2(b,c,d,e,a,34); R2(a,b,c,d,e,35);
	R2(e,a,b,c,d,36); R2(d,e,a,b,c,37); R2(c,d,e,a,b,38); R2(b,c,d,e,a,39);
	R3(a,b,c,d,e,40); R3(e,a,b,c,d,41); R3(d,e,a,b,c,42); R3(c,d,e,a,b,43);
	R3(b,c,d,e,a,44); R3(a,b,c,d,e,45); R3(e,a,b,c,d,46); R3(d,e,a,b,c,47);
	R3(c,d,e,a,b,48); R3(b,c,d,e,a,49); R3(a,b,c,d,e,50); R3(e,a,b,c,d,51);
	R3(d,e,a,b,c,52); R3(c,d,e,a,b,53); R3(b,c,d,e,a,54); R3(a,b,c,d,e,55);
	R3(e,a,b,c,d,56); R3(d,e,a,b,c,57); R3(c,d,e,a,b,58); R3(b,c,d,e,a,59);
	R4(a,b,c,d,e,60); R4(e,a,b,c,d,61); R4(d,e,a,b,c,62); R4(c,d,e,a,b,63);
	R4(b,c,d,e,a,64); R4(a,b,c,d,e,65); R4(e,a,b,c,d,66); R4(d,e,a,b,c,67);
	R4(c,d,e,a,b,68); R4(b,c,d,e,a,69); R4(a,b,c,d,e,70); R4(e,a,b,c,d,71);
	R4(d,e,a,b,c,72); R4(c,d,e,a,b,73); R4(b,c,d,e,a,74); R4(a,b,c,d,e,75);
	R4(e,a,b,c,d,76); R4(d,e,a,b,c,77); R4(c,d,e,a,b,78); R4(b,c,d,e,a,79);

	a+=0x67452301;
	return (a>>24)\|((a>>8)&0xff00)\|((a<<8)&0xff0000)\|((a<<24));
	}

	static inline int64_t difftimespec_ns(const struct timespec after, const struct timespec before)
	{
	return ((int64_t)after.tv_sec - (int64_t)before.tv_sec) * (int64_t)1000000000
	+ ((int64_t)after.tv_nsec - (int64_t)before.tv_nsec);
	}

	char **dict;
	char *dict_member_length;
	int dict_count;
	unsigned int *hash;
	int hash_count;

	int load_hash_list(char *filename)
	{
	int i;
	unsigned int t;
	FILE *fp;
	printf("Reading hash file '%s'\n", filename);
	if ((fp = fopen(filename, "rt")) == NULL)
	return -1;
	hash_count = 0;
	while (fscanf(fp, "0x%x\n", &t) == 1)
	hash_count++;
	printf("hash_count = %d\n", hash_count);
	fseek(fp, 0, SEEK_SET);
	hash = malloc(hash_count * sizeof(unsigned int));
	i = 0;
	while (fscanf(fp, "0x%x\n", &hash[i++]) == 1);
	fclose(fp);
	return 0;
	}

	int load_dictionary(char *filename)
	{
	int i;
	char buffer[0x200];
	FILE *fp;
	printf("Reading dictionary file '%s'\n", filename);
	if ((fp = fopen(filename, "rt")) == NULL)
	return -1;
	dict_count = 0;
	while (fscanf(fp, "%s\n", buffer) != EOF)
	dict_count++;
	printf("dict_count = %d\n", dict_count);
	fseek(fp, 0, SEEK_SET);
	dict = (char *) malloc(dict_count sizeof(char *));
	dict_member_length = malloc(dict_count);
	i = 0;
	while (fscanf(fp, "%s\n", buffer) == 1) {
	if ((buffer[0] == '-') \|\| (buffer[0] == '/')) { // This handles comments in the dic file
	} else { // Not a comment, so do duplicate check
	int count;
	int found = 0;
	for (count = 0; count < (i - 1); count++)
	if (strcmp(buffer, dict[count]) == 0)
	found = 1;
	if (found == 0) { // If not already in dictionary, then add
	dict_member_length[i] = strlen(buffer);
	dict[i] = malloc(dict_member_length[i] + 1);
	strcpy(dict[i], buffer);
	i++;
	}
	}
	}
	dict_count = i;
	fclose(fp);
	return 0;
	}

	FILE *fout;

	// Hash seems to be where the program spends most of its time, so we need to speedup the
	// search somehow
	// 32 bit value, 4 bytes
	// what we do, is pre-sort the hashlist, so they are in order AABBCCDD
	// Then index each byte into the list, hence cutting down the search space considerably
	#define VER2_SIZE 256
	// midsearch should hopefully fit in cache, so will
	// help quite a lot with rejection testing.
	int midsearch[VER2_SIZE*VER2_SIZE];
	// bigsearch is really a cop out, will not fit in cache, but still quicker
	// than checking many elements.
	int bigsearch[VER2_SIZEVER2_SIZEVER2_SIZE];

	void fillsearchtable()
	{
	unsigned int searchval;
	int hashpos,hashpos2,hashpos3;
	int count,count2,count3;
	// Firstly Sort the hashlist, order AABBCCDD
	int found = 1;
	printf("Sorting Hashlist\n");
	while (found == 1)
	{
	found = 0;
	for (count=0;count<(hash_count-1);count++)
	{
	if (hash[count] > hash[count+1])
	{ // swap entries if wrong way around
	unsigned int temp = hash[count+1];
	hash[count+1] = hash[count];
	hash[count] = temp;
	found = 1;
	}
	}
	}
	printf("Clearing Search Tree\n");
	// Really lazy slow clear array, but who cares only done once
	for (count=0;count<(VER2_SIZE*VER2_SIZE);count++)
	{
	midsearch[count] = -1;
	}
	for (count=0;count<(VER2_SIZEVER2_SIZEVER2_SIZE);count++)
	{
	bigsearch[count] = -1;
	}
	printf("Building Search Tree\n");
	// Now build the toplevel (first) byte
	//#pragma omp parallel for
	for (count=0;count<256;count++)
	{ // Find the first firstbyte in the hashlist that matches this value
	hashpos = 0;
	searchval = (count<<24);
	while ((hash[hashpos]&0xff000000) < searchval && hashpos < hash_count - 1)
	hashpos++;
	if ((hash[hashpos]&0xff000000) == searchval)
	{
	// Now Search for a twobyte combo
	for (count2=0;count2<256;count2++)
	{ // Find the first secondbyte in the hashlist from this pos
	hashpos2 = hashpos;
	searchval = (count<<24) \| (count2<<16);
	while ((hash[hashpos2]&0xffff0000) < searchval &&
	hashpos2 < hash_count - 1) hashpos2++;
	if ((hash[hashpos2]&0xffff0000) == searchval)
	{ // Add this entry
	midsearch[(count<<8)+count2] = hashpos2;

	// Now Search for a threebyte combo
	for (count3=0;count3<256;count3++)
	{ // Find the first thirdbyte in the hashlist from this pos
	hashpos3 = hashpos2;
	searchval = (count<<24) \| (count2<<16) \| (count3<<8);
	while ((hash[hashpos3]&0xffffff00) < searchval &&
	hashpos3 < hash_count - 1) hashpos3++;
	if ((hash[hashpos3]&0xffffff00) == searchval)
	{ // Add this entry
	bigsearch[(count<<16)+(count2<<8)+count3] = hashpos2;
	}
	}
	}
	}
	}
	}
	}

	int findhash(char *buffer, int size, int isPS3)
	{
	int h;
	unsigned int hashvalue;
	unsigned int index1;
	unsigned int index2;
	unsigned int index3;
	u8 int_buff[MAX_HASH_BUFF];
	u8* buff_ptr;
	const u8 ps3_key[16] = {
	0x67, 0x59, 0x65, 0x99, 0x04, 0x25, 0x04, 0x90,
	0x56, 0x64, 0x27, 0x49, 0x94, 0x89, 0x74, 0x1A };

	if(isPS3)
	{
	buff_ptr = int_buff;
	memcpy(int_buff, buffer, size);
	memcpy(int_buff+size, ps3_key, 16);
	size += 16;
	}
	else
	{
	buff_ptr = buffer;
	}

	//fastSHA1 doesn't support strings larger than MAX_HASH_BUFF-1 bytes
	//and chances are unlikely that function names are that
	//long anyway so reject them before doing processing
	if (size > MAX_HASH_BUFF-1)
	return 0;
	hashvalue = fastSHA1(buff_ptr, size);
	index1 = (hashvalue & 0xff000000)>>24;
	index2 = (hashvalue & 0x00ff0000)>>16;
	index3 = (hashvalue & 0x0000ff00)>>8;
	int pos;
	// Not sure if this really helps or not, should do.. on early rejection
	// memory accesses if nothing else
	pos = midsearch[(index1<<8)+index2];
	if (pos != -1)
	{
	// Get threebyte position
	pos = bigsearch[(index1<<16)+(index2<<8)+index3];
	if (pos != -1)
	{ // Found a position, so search from here
	for(h=pos; h<hash_count; h++)
	{
	if (hashvalue >= hash[h])
	if(hashvalue == hash[h])
	{ // If equal, found
	#pragma omp critical
	{
	printf("Found : 0x%08x %s \n",hashvalue,buffer);
	fprintf(fout,"<FUNC><NID>0x%08x</NID><NAME>%s</NAME></FUNC>\n",hashvalue,buffer);
	}
	return 1;
	}
	else // If not, reject as above
	return 0;
	}
	}
	}
	return 0;
	}

	int main(int argc, char **argv)
	{
	char gbuffer[0x200];
	struct timespec start, end;
	int is_ps3_flag = 0;

	char *prefix = "";
	int prefixlen = 0;

	printf("SHA1 hash dictionary attack v2.1 by adresd\n");
	printf("based on the original by djhuevo\n");
	printf("PS3 support added by xorloser\n");

	if (argc < 3) {
	printf("usage:\n\t%s <hash_list> <dictionary> [-ps3] [prefix]\n", argv[0]);
	return 1;
	}

	if (load_hash_list(argv[1]) < 0) {
	fprintf(stderr, "can't open the hash file %s\n", argv[1]);
	return 2;
	}

	if (load_dictionary(argv[2]) < 0) {
	fprintf(stderr, "can't open the dictionary file %s\n", argv[2]);
	return 3;
	}

	if (argc > 3) {
	if( !strcmp("-ps3", argv[3]) ) {
	is_ps3_flag = 1;
	if (argc > 4) {
	prefix = argv[4];
	strcpy(gbuffer, prefix);
	prefixlen = strlen(prefix);
	}
	}
	else
	{
	prefix = argv[3];
	strcpy(gbuffer, prefix);
	prefixlen = strlen(prefix);
	}
	}

	if (hash_count < 1 \|\| dict_count < 1) {
	fprintf(stderr, "error on input data.\n");
	fprintf(stderr, "hash_count = %d, dict_count = %d\n", hash_count, dict_count);
	return 4;
	}

	if ((fout = fopen("results.xml", "wba")) <= 0) {
	printf("Failed to open output file\n");
	exit(1);
	}

	printf("\nprefix : '%s'\n", prefix != "" ? prefix : "<None>");
	printf("hash count : %d\n", hash_count);
	printf("dictionary words: %d\n\n", dict_count);

	fillsearchtable();

	printf("\nsearching...\n\n");
	fflush(stdout);
	clock_gettime(CLOCK_MONOTONIC, &start);

	// First Word
	#pragma omp parallel for
	for (int x = 0; x < dict_count; x++) {
	char buffer[0x200];
	int i; // , j, h;
	int y, z, zz, z2;
	char ptr, ptr0, ptr1, ptr2, ptr3, ptr4;
	strcpy(buffer, gbuffer);
	ptr0 = &buffer[prefixlen];
	for (i = 0; i < dict_member_length[x]; i++) {
	*(ptr0++) = dict[x][i];
	}
	*(ptr0) = 0;
	#pragma omp critical
	printf("// processing word: %s\n", buffer);
	//fflush(stdout);
	// Second word
	for (y = 0; y < dict_count; y++) {
	ptr1 = ptr0;
	for (i = 0; i < dict_member_length[y]; i++) {
	*(ptr1++) = dict[y][i];
	}
	*(ptr1) = 0;
	//printf("// processing word: %s\n",buffer);

	// Only do next loop if first and second dont match
	if (strcmp(dict[x], dict[y]) != 0) {
	// Third Word
	for (z = 0; z < dict_count; z++) {
	ptr2 = ptr1;
	for (i = 0; i < dict_member_length[z]; i++) {
	*(ptr2++) = dict[z][i];
	}
	// Only do next loop if second and third dont match
	if (strcmp(dict[y], dict[z]) != 0) {
	// Fourth Word
	for (zz = 0; zz < dict_count; zz++) {
	ptr3 = ptr2;
	for (i = 0; i < dict_member_length[zz]; i++) {
	*(ptr3++) = dict[zz][i];
	}
	// Only do next loop if third and fourth dont match
	if (strcmp(dict[z], dict[zz]) != 0) {
	// Fifth Word
	for (z2 = 0; z2 < dict_count; z2++) {
	ptr4 = ptr3;
	for (i = 0; i < dict_member_length[z2]; i++) {
	*(ptr4++) = dict[z2][i];
	}
	*(ptr4) = 0x00;
	findhash(buffer, ptr4 - buffer, is_ps3_flag);
	}
	}
	*(ptr3) = 0x00;
	findhash(buffer, ptr3 - buffer, is_ps3_flag);
	}
	}
	*(ptr2) = 0x00;
	findhash(buffer, ptr2 - buffer, is_ps3_flag);
	}
	}
	*(ptr1) = 0x00;
	findhash(buffer, ptr1 - buffer, is_ps3_flag);
	}
	*(ptr0) = 0x00;
	findhash(buffer, ptr0 - buffer, is_ps3_flag);
	}
	clock_gettime(CLOCK_MONOTONIC, &end);
	printf("\n\nhash count : %d\n", hash_count);
	printf("dictionary words: %d\n\n", dict_count);
	printf("\n\ntime : %f seconds.\n", difftimespec_ns(end, start) / 1000000000.0);

	fclose(fout);
	return 0;
	}