--- /dev/null
+//============================================================================\r
+// Name : rcuda_ntlm.inc\r
+// Author : Jan Kyska\r
+// Version : 1.00\r
+// Description : NTLM hash kernel for Generator of FreeRainbowTables\r
+//============================================================================ \r
+\r
+// MD4 building blocks for the NTLM chain generator: the initial state, the\r
+// per-step rotate/word-order tables, the three round step functions and the\r
+// single-block compression routine.\r
+namespace RC_NTLM {\r
+\r
+// Initial chaining values; they are also added back onto the state after the last step.\r
+__device__ __constant__ unsigned int h[4] = {\r
+ 0x67452301, 0xEFCDAB89, 0x98BADCFE, 0x10325476\r
+};\r
+\r
+// Left-rotate amount for each of the 48 steps (16 steps per round).\r
+__device__ __constant__ unsigned char r[48] = {\r
+ 3, 7, 11, 19, 3, 7, 11, 19, 3, 7, 11, 19, 3, 7, 11, 19,\r
+ 3, 5, 9, 13, 3, 5, 9, 13, 3, 5, 9, 13, 3, 5, 9, 13,\r
+ 3, 9, 11, 15, 3, 9, 11, 15, 3, 9, 11, 15, 3, 9, 11, 15\r
+};\r
+\r
+// Index of the message word consumed by each of the 48 steps.\r
+__device__ __constant__ unsigned char g[48] = {\r
+ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,\r
+ 0, 4, 8, 12, 1, 5, 9, 13, 2, 6, 10, 14, 3, 7, 11, 15,\r
+ 0, 8, 4, 12, 2, 10, 6, 14, 1, 9, 5, 13, 3, 11, 7, 15\r
+};\r
+\r
+// Round 1 step: adds the bitwise select (b ? c : d) and message word g[i] to a,\r
+// then rotates the sum left by r[i] bits. Message words are read through SHIDX.\r
+__device__ unsigned int FF(unsigned int a, unsigned int b, unsigned int c, unsigned int d, int i, const unsigned int* data) {\r
+ const unsigned int shift = r[i];\r
+ const unsigned int select = (b&c)|((~b)&d);\r
+ const unsigned int sum = a + select + data[SHIDX(g[i])];\r
+ return (sum<<shift)|(sum>>(32-shift));\r
+}\r
+\r
+// Round 2 step: adds the bitwise majority of b, c, d, message word g[i] and the\r
+// constant 0x5a827999 to a, then rotates the sum left by r[i] bits.\r
+__device__ unsigned int GG(unsigned int a, unsigned int b, unsigned int c, unsigned int d, int i, const unsigned int* data) {\r
+ const unsigned int shift = r[i];\r
+ const unsigned int majority = (b&c)|(b&d)|(c&d);\r
+ const unsigned int sum = a + majority + data[SHIDX(g[i])] + 0x5a827999u;\r
+ return (sum<<shift)|(sum>>(32-shift));\r
+}\r
+\r
+// Round 3 step: adds b^c^d, message word g[i] and the constant 0x6ed9eba1 to a,\r
+// then rotates the sum left by r[i] bits.\r
+__device__ unsigned int HH(unsigned int a, unsigned int b, unsigned int c, unsigned int d, int i, const unsigned int* data) {\r
+ const unsigned int shift = r[i];\r
+ const unsigned int parity = b^c^d;\r
+ const unsigned int sum = a + parity + data[SHIDX(g[i])] + 0x6ed9eba1u;\r
+ return (sum<<shift)|(sum>>(32-shift));\r
+}\r
+\r
+// Runs the 48 MD4 steps over the 16 message words reachable through\r
+// dataHash[SHIDX(0..15)] and overwrites dataHash[SHIDX(0..3)] with the digest.\r
+__device__ void MD4(unsigned int* dataHash) {\r
+ unsigned int a = h[0];\r
+ unsigned int b = h[1];\r
+ unsigned int c = h[2];\r
+ unsigned int d = h[3];\r
+\r
+ // After every step the four registers rotate roles: the fresh value becomes b,\r
+ // the previous b becomes c, the previous c becomes d and the previous d becomes a.\r
+\r
+ // Round 1: steps 0..15\r
+ for(int step = 0; step < 16; ++step) {\r
+  const unsigned int prevB = b;\r
+  b = FF(a, b, c, d, step, dataHash);\r
+  a = d;\r
+  d = c;\r
+  c = prevB;\r
+ }\r
+\r
+ // Round 2: steps 16..31\r
+ for(int step = 16; step < 32; ++step) {\r
+  const unsigned int prevB = b;\r
+  b = GG(a, b, c, d, step, dataHash);\r
+  a = d;\r
+  d = c;\r
+  c = prevB;\r
+ }\r
+\r
+ // Round 3: steps 32..47\r
+ for(int step = 32; step < 48; ++step) {\r
+  const unsigned int prevB = b;\r
+  b = HH(a, b, c, d, step, dataHash);\r
+  a = d;\r
+  d = c;\r
+  c = prevB;\r
+ }\r
+\r
+ // Feed-forward: add the initial values and store the digest in place.\r
+ dataHash[SHIDX(0)] = a + h[0];\r
+ dataHash[SHIDX(1)] = b + h[1];\r
+ dataHash[SHIDX(2)] = c + h[2];\r
+ dataHash[SHIDX(3)] = d + h[3];\r
+}\r
+\r
+}\r
+\r
+// Kernel for one stretch of NTLM rainbow-chain generation: turns the current\r
+// chain index into a plaintext, lays it out as a padded MD4 message block in\r
+// hData and hashes it in place with RC_NTLM::MD4.\r
+//\r
+// chainStart / chainStop are not referenced directly in this body; presumably\r
+// they are consumed by RTGEN_PROLOGUE / RTGEN_EPILOGUE -- TODO confirm.\r
+//\r
+// NOTE(review): ii, idx, idx64, hData, cplStart, cplDimVec, cplChrSet,\r
+// PLAIN_MAX_SIZE and SHIDX are not declared in this file; they are presumably\r
+// provided by RTGEN_PROLOGUE or by the file that includes this one -- verify.\r
+__global__ void RTGenNTLMKernel(unsigned int chainStart, unsigned int chainStop) {\r
+ uint3 dimItem;\r
+ uint64 uiDiv64, uiVal64, uiMul64;\r
+ unsigned int uiVal, uiDiv;\r
+ unsigned int size, jj, kk;\r
+ unsigned int plain;\r
+\r
+ RTGEN_PROLOGUE;\r
+ \r
+ // transform to the plain text\r
+ // plain accumulates characters and starts with 0x80 (presumably the MD4\r
+ // padding marker byte -- confirm). Completed words are written downwards,\r
+ // starting at hData slot (PLAIN_MAX_SIZE>>1)+1.\r
+ plain = 0x80;\r
+ jj = (PLAIN_MAX_SIZE>>1)+1;\r
+\r
+ // Phase 1: 64-bit arithmetic while the index exceeds 0xfffffff0.\r
+ // Each iteration divides (idx64 + cplStart[ii] - 1) by dimItem.x without a\r
+ // hardware divide: dimItem.y appears to be a precomputed fixed-point\r
+ // reciprocal of dimItem.x (TODO confirm where cplDimVec is filled). The\r
+ // quotient becomes the new idx64 and the remainder uiDiv selects a character.\r
+ for(ii = kk = 0; idx64 > 0xfffffff0ull && ii < PLAIN_MAX_SIZE; ii++) {\r
+ uiVal64 = idx64 + cplStart[ii];\r
+ uiVal64--;\r
+ dimItem = cplDimVec[ii];\r
+\r
+ // First quotient estimate from the high 64 bits of uiVal64 * (dimItem.y << 32).\r
+ uiMul64 = (uint64)dimItem.y<<32;\r
+ idx64 = __umul64hi(uiVal64, uiMul64);\r
+ uiDiv64 = uiVal64 - idx64*(uint64)dimItem.x;\r
+ // Refine using the low 32 bits of the remaining value.\r
+ uiVal = __umulhi((unsigned int)uiDiv64, dimItem.y);\r
+ uiDiv = (unsigned int)uiDiv64 - uiVal * dimItem.x;\r
+ idx64 += uiVal;\r
+ // Single correction step when the remainder is still >= the divisor.\r
+ if(uiDiv >= dimItem.x) {\r
+ uiDiv -= dimItem.x;\r
+ idx64++;\r
+ }\r
+ // Each character occupies 16 bits of plain: an 8-bit shift here plus an\r
+ // 8-bit shift when the character is inserted below. On every second\r
+ // character (kk odd) the filled word is flushed to hData and jj moves down.\r
+ plain = (plain<<8);\r
+ if((kk++)&1) {\r
+ hData[SHIDX(jj--)] = plain;\r
+ plain = 0;\r
+ }\r
+ // dimItem.z is the offset into cplChrSet for this position; uiDiv picks the character.\r
+ plain = (plain<<8) | cplChrSet[dimItem.z + uiDiv];\r
+ }\r
+\r
+ // Phase 2: same decomposition with 32-bit arithmetic, continuing at the\r
+ // current ii until the index reaches 0 or PLAIN_MAX_SIZE characters are produced.\r
+ for(idx = (unsigned int)idx64; idx != 0 && ii < PLAIN_MAX_SIZE; ii++) {\r
+ uiVal = idx + cplStart[ii];\r
+ uiVal--;\r
+ dimItem = cplDimVec[ii];\r
+\r
+ // Quotient estimate via high multiply, remainder, then one correction step.\r
+ idx = __umulhi(uiVal, dimItem.y);\r
+ uiDiv = uiVal - idx*dimItem.x;\r
+ if(uiDiv >= dimItem.x) {\r
+ uiDiv -= dimItem.x;\r
+ idx++;\r
+ }\r
+ // Same 16-bits-per-character packing and flush as in phase 1.\r
+ plain = (plain<<8);\r
+ if((kk++)&1) {\r
+ hData[SHIDX(jj--)] = plain;\r
+ plain = 0;\r
+ }\r
+ plain = (plain<<8) | cplChrSet[dimItem.z + uiDiv];\r
+ }\r
+\r
+ // prepare for MD4\r
+ // size = 2 * number of characters produced, i.e. the message length in bytes\r
+ // at two bytes per character (presumably UTF-16LE as NTLM requires -- confirm).\r
+ size = (ii<<1);\r
+ // ii is reused as a bit shift: 24 when kk is even, 8 when kk is odd.\r
+ ii = (((kk^1)&1)<<4)+8;\r
+ plain = plain<<ii;\r
+ // Walk jj back up over the words flushed above and write the re-aligned\r
+ // message to hData from slot 0, merging each pair of neighbouring words.\r
+ for(jj++, idx = 0; jj <= (PLAIN_MAX_SIZE>>1)+1; plain = hData[SHIDX(jj++)], idx++)\r
+ hData[SHIDX(idx)] = (plain>>ii)|(hData[SHIDX(jj)]<<(32-ii));\r
+ // Last word: only the bits remaining in plain.\r
+ hData[SHIDX(idx)] = plain>>ii;\r
+ // Zero the remaining words below slot 14.\r
+ for(idx++; idx < 14; idx++)\r
+ hData[SHIDX(idx)] = 0;\r
+ // Message length in bits (size<<3) goes into the next slot (slot 14 when the\r
+ // message ended below it), followed by a zero word.\r
+ hData[SHIDX(idx++)] = size<<3;\r
+ hData[SHIDX(idx)] = 0;\r
+\r
+ // hash\r
+ // MD4 reads the 16 message words from hData and overwrites hData[SHIDX(0..3)] with the digest.\r
+ RC_NTLM::MD4(hData);\r
+\r
+ RTGEN_EPILOGUE\r
+}\r