binary searching is finished!

This commit is contained in:
cathugger 2017-10-10 01:02:43 +00:00
parent 00df4f8416
commit 586d977fa0
2 changed files with 167 additions and 67 deletions

View file

@ -153,6 +153,26 @@ else
fi fi
fi fi
AC_ARG_ENABLE([binfilterlen],
[AS_HELP_STRING([--enable-binfilterlen=VAL],
[set binary string filter length (if you don't use intfilter) @<:@default=32@:>@])],
[], [enable_binfilterlen=no]
)
if test "x$enable_binfilterlen" != "xyes" -a "x$enable_binfilterlen" != "xno"
then
MYDEFS="$MYDEFS -DBINFILTERLEN=$enable_binfilterlen"
fi
AC_ARG_ENABLE([binsearch],
[AS_HELP_STRING([--enable-binsearch],
[enable binary search algoritm; MUCH faster if there are a lot of filters @<:@default=no@:>@])],
[], [enable_binsearch=no]
)
if test "x$enable_binsearch" = "xyes"
then
MYDEFS="$MYDEFS -DBINSEARCH"
fi
AC_ARG_ENABLE([statistics], AC_ARG_ENABLE([statistics],
[AS_HELP_STRING([--enable-statistics], [AS_HELP_STRING([--enable-statistics],
[collect statistics @<:@default=yes@:>@])], [collect statistics @<:@default=yes@:>@])],

212
main.c
View file

@ -67,8 +67,11 @@ static void termhandler(int sig)
// filters stuff // filters stuff
#ifndef BINFILTERLEN
#define BINFILTERLEN PUBLIC_LEN
#endif
struct binfilter { struct binfilter {
u8 f[PUBLIC_LEN]; u8 f[BINFILTERLEN];
size_t len; // real len minus one size_t len; // real len minus one
u8 mask; u8 mask;
} ; } ;
@ -226,10 +229,7 @@ static void ifilter_addexpanded(
static void ifilter_expand(IFT dmask,IFT smask,IFT cmask,int ishift,int rshift) static void ifilter_expand(IFT dmask,IFT smask,IFT cmask,int ishift,int rshift)
{ {
size_t len = VEC_LENGTH(ifilters); size_t len = VEC_LENGTH(ifilters);
printf(">expand:cm:%08X,len:%d,cm*len:%d\n",
cmask,(int)len,(int)(cmask * len));
VEC_ADDN(ifilters,cmask * len); VEC_ADDN(ifilters,cmask * len);
printf(">expand after\n");
size_t esz = cmask + 1; // size of expanded elements size_t esz = cmask + 1; // size of expanded elements
for (size_t i = len - 1;;--i) { for (size_t i = len - 1;;--i) {
for (IFT j = 0;;++j) { for (IFT j = 0;;++j) {
@ -246,16 +246,13 @@ static void ifilter_expand(IFT dmask,IFT smask,IFT cmask,int ishift,int rshift)
static inline void ifilter_addflatten(struct intfilter *ifltr,IFT mask) static inline void ifilter_addflatten(struct intfilter *ifltr,IFT mask)
{ {
printf(">enter flatten,f:%08X,m:%08X\n",ifltr->f,mask);
if (VEC_LENGTH(ifilters) == 0) { if (VEC_LENGTH(ifilters) == 0) {
printf(">flatten simple\n");
// simple // simple
VEC_ADD(ifilters,*ifltr); VEC_ADD(ifilters,*ifltr);
ifiltermask = mask; ifiltermask = mask;
return; return;
} }
if (ifiltermask == mask) { if (ifiltermask == mask) {
printf(">flatten lucky\n");
// lucky, only need to insert at the right place // lucky, only need to insert at the right place
VEC_FOR(ifilters,i) { VEC_FOR(ifilters,i) {
if (VEC_BUF(ifilters,i).f > ifltr->f) { if (VEC_BUF(ifilters,i).f > ifltr->f) {
@ -266,24 +263,18 @@ static inline void ifilter_addflatten(struct intfilter *ifltr,IFT mask)
VEC_ADD(ifilters,*ifltr); VEC_ADD(ifilters,*ifltr);
return; return;
} }
printf(">flatten complicated; em:0x%08X,m:0x%08X\n",ifiltermask,mask);
IFT cross = ifiltermask ^ mask; IFT cross = ifiltermask ^ mask;
printf(">cross:%08X\n",cross);
int ishift = 0; int ishift = 0;
while ((cross & 1) == 0) { while ((cross & 1) == 0) {
++ishift; ++ishift;
cross >>= 1; cross >>= 1;
} }
printf(">ishift:%d,cross:%08X\n",ishift,cross);
IFT smask = cross & (cross + 1); // shift mask IFT smask = cross & (cross + 1); // shift mask
printf(">smask:%08X\n",smask);
IFT dmask = cross ^ smask; // direct mask IFT dmask = cross ^ smask; // direct mask
printf(">dmask:%08X\n",dmask);
IFT cmask; // combined mask IFT cmask; // combined mask
int rshift = 0; // relative shift int rshift = 0; // relative shift
while (cmask = (smask >> rshift) | dmask,(cmask & (cmask + 1)) != 0) while (cmask = (smask >> rshift) | dmask,(cmask & (cmask + 1)) != 0)
++rshift; ++rshift;
printf(">cmask:%08X,rshift:%d\n",cmask,rshift);
// preparations done // preparations done
if (ifiltermask > mask) { if (ifiltermask > mask) {
// already existing stuff has more precise mask than we // already existing stuff has more precise mask than we
@ -330,10 +321,14 @@ static void filters_add(const char *filter)
} fc,mc; } fc,mc;
#endif #endif
// skip regex start symbol. we do not support regex tho
if (*filter == '^')
++filter;
memset(&bf,0,sizeof(bf)); memset(&bf,0,sizeof(bf));
if (!base32_valid(filter,&ret)) { if (!base32_valid(filter,&ret)) {
fprintf(stderr, "filter \"%s\" is invalid\n", filter); fprintf(stderr,"filter \"%s\" is invalid\n",filter);
return; return;
} }
ret = BASE32_FROM_LEN(ret); ret = BASE32_FROM_LEN(ret);
@ -342,10 +337,10 @@ static void filters_add(const char *filter)
#ifdef INTFILTER #ifdef INTFILTER
if (ret > sizeof(IFT)) if (ret > sizeof(IFT))
#else #else
if (ret > PUBLIC_LEN) if (ret > sizeof(bf.f))
#endif #endif
{ {
fprintf(stderr, "filter \"%s\" is too long\n", filter); fprintf(stderr,"filter \"%s\" is too long\n",filter);
return; return;
} }
ret2 = base32_from(bf.f,&bf.mask,filter); ret2 = base32_from(bf.f,&bf.mask,filter);
@ -403,7 +398,18 @@ static void filters_add(const char *filter)
} }
} }
#ifdef BINSEARCH #ifdef BINSEARCH
// TODO VEC_FOR(bfilters,i) {
/*
* mask is irrelevant, as they're not
* conflicting and have proper order
* (unlike when using little endian words)
*/
if (memcmp(VEC_BUF(bfilters,i).f,bf.f,sizeof(bf.f)) > 0) {
VEC_INSERT(bfilters,i,bf);
return;
}
}
VEC_ADD(bfilters,bf);
#else #else
VEC_FOR(bfilters,i) { VEC_FOR(bfilters,i) {
// filter with least bits first // filter with least bits first
@ -440,21 +446,93 @@ static size_t filters_count()
#ifdef INTFILTER #ifdef INTFILTER
#define FILTERFOR(it) for (it = 0;it < VEC_LENGTH(ifilters);++it)
#ifndef BINSEARCH #ifndef BINSEARCH
#define MATCHFILTER(it,pk) ((*(IFT *)(pk) & VEC_BUF(ifilters,it).m) == VEC_BUF(ifilters,it).f)
#else
#define MATCHFILTER(it,pk) ((*(IFT *)(pk) & ifiltermask) == VEC_BUF(ifilters,it).f)
#endif
#else #define MATCHFILTER(it,pk) \
((*(IFT *)(pk) & VEC_BUF(ifilters,it).m) == VEC_BUF(ifilters,it).f)
#define DOFILTER(it,pk,code) { \
for (it = 0;it < VEC_LENGTH(ifilters);++it) { \
if (unlikely(MATCHFILTER(it,pk))) { \
code; \
break; \
} \
} \
}
#else // BINSEARCH
#define DOFILTER(it,pk,code) { \
for (size_t down = 0,up = VEC_LENGTH(ifilters);down < up;) { \
it = (up + down) / 2; \
if ((*(IFT *)(pk) & ifiltermask) < VEC_BUF(ifilters,it).f) \
up = it; \
else if ((*(IFT *)(pk) & ifiltermask) > VEC_BUF(ifilters,it).f) \
down = it + 1; \
else { \
code; \
break; \
} \
} \
}
#endif // BINSEARCH
#else // INTFILTER
#ifndef BINSEARCH
#define FILTERFOR(it) for (it = 0;it < VEC_LENGTH(bfilters);++it)
#define MATCHFILTER(it,pk) ( \ #define MATCHFILTER(it,pk) ( \
memcmp(pk,VEC_BUF(bfilters,it).f,VEC_BUF(bfilters,it).len) == 0 && \ memcmp(pk,VEC_BUF(bfilters,it).f,VEC_BUF(bfilters,it).len) == 0 && \
(pk[VEC_BUF(bfilters,it).len] & VEC_BUF(bfilters,it).mask) == VEC_BUF(bfilters,it).f[VEC_BUF(bfilters,it).len]) (pk[VEC_BUF(bfilters,it).len] & VEC_BUF(bfilters,it).mask) == VEC_BUF(bfilters,it).f[VEC_BUF(bfilters,it).len])
#endif #define DOFILTER(it,pk,code) { \
for (it = 0;it < VEC_LENGTH(bfilters);++it) { \
if (unlikely(MATCHFILTER(it,pk))) { \
code; \
break; \
} \
} \
}
#else // BINSEARCH
#define DOFILTER(it,pk,code) { \
for (size_t down = 0,up = VEC_LENGTH(bfilters);down < up;) { \
it = (up + down) / 2; \
{ \
register int filterdiff = memcmp(pk,VEC_BUF(bfilters,it).f,VEC_BUF(bfilters,it).len); \
if (filterdiff < 0) { \
up = it; \
continue; \
} \
if (filterdiff > 0) { \
down = it + 1; \
continue; \
} \
} \
if ((pk[VEC_BUF(bfilters,it).len] & VEC_BUF(bfilters,it).mask) < \
VEC_BUF(bfilters,it).f[VEC_BUF(bfilters,it).len]) \
{ \
up = it; \
continue; \
} \
if ((pk[VEC_BUF(bfilters,it).len] & VEC_BUF(bfilters,it).mask) > \
VEC_BUF(bfilters,it).f[VEC_BUF(bfilters,it).len]) \
{ \
down = it + 1; \
continue; \
} \
{ \
code; \
break; \
} \
} \
}
#endif // BINSEARCH
#endif // INTFILTER
static void loadfilterfile(const char *fname) static void loadfilterfile(const char *fname)
{ {
@ -644,6 +722,8 @@ static void *dowork(void *task)
hashsrc[checksumstrlen + PUBLIC_LEN] = 0x03; // version hashsrc[checksumstrlen + PUBLIC_LEN] = 0x03; // version
sname = malloc(workdirlen + ONIONLEN + 63 + 1); sname = malloc(workdirlen + ONIONLEN + 63 + 1);
if (!sname)
abort();
if (workdir) if (workdir)
memcpy(sname,workdir,workdirlen); memcpy(sname,workdir,workdirlen);
@ -664,22 +744,20 @@ again:
++st->numcalc.v; ++st->numcalc.v;
#endif #endif
FILTERFOR(i) { DOFILTER(i,pk,{
if (unlikely(MATCHFILTER(i,pk))) {
#ifdef STATISTICS #ifdef STATISTICS
++st->numsuccess.v; ++st->numsuccess.v;
#endif #endif
// calc checksum // calc checksum
memcpy(&hashsrc[checksumstrlen],pk,PUBLIC_LEN); memcpy(&hashsrc[checksumstrlen],pk,PUBLIC_LEN);
FIPS202_SHA3_256(hashsrc,sizeof(hashsrc),&pk[PUBLIC_LEN]); FIPS202_SHA3_256(hashsrc,sizeof(hashsrc),&pk[PUBLIC_LEN]);
// version byte // version byte
pk[PUBLIC_LEN + 2] = 0x03; pk[PUBLIC_LEN + 2] = 0x03;
// base32 // base32
strcpy(base32_to(&sname[direndpos],pk,PUBONION_LEN), ".onion"); strcpy(base32_to(&sname[direndpos],pk,PUBONION_LEN), ".onion");
onionready(sname, secret, pubonion.raw); onionready(sname, secret, pubonion.raw);
goto initseed; goto initseed;
} });
}
addseed(seed); addseed(seed);
goto again; goto again;
@ -729,6 +807,8 @@ static void *dofastwork(void *task)
hashsrc[checksumstrlen + PUBLIC_LEN] = 0x03; // version hashsrc[checksumstrlen + PUBLIC_LEN] = 0x03; // version
sname = malloc(workdirlen + ONIONLEN + 63 + 1); sname = malloc(workdirlen + ONIONLEN + 63 + 1);
if (!sname)
abort();
if (workdir) if (workdir)
memcpy(sname, workdir, workdirlen); memcpy(sname, workdir, workdirlen);
@ -748,34 +828,32 @@ initseed:
if (unlikely(endwork)) if (unlikely(endwork))
goto end; goto end;
FILTERFOR(i) { DOFILTER(i,pk,{
if (unlikely(MATCHFILTER(i,pk))) { // found!
// found! // update secret key with counter
// update secret key with counter addu64toscalar32(sk,counter);
addu64toscalar32(sk,counter); // sanity check
// sanity check if (((sk[0] & 248) == sk[0]) && (((sk[31] & 63) | 64) == sk[31])) {
if (((sk[0] & 248) == sk[0]) && (((sk[31] & 63) | 64) == sk[31])) { /* These operations should be a no-op. */
/* These operations should be a no-op. */ sk[0] &= 248;
sk[0] &= 248; sk[31] &= 63;
sk[31] &= 63; sk[31] |= 64;
sk[31] |= 64;
}
else goto initseed;
#ifdef STATISTICS
++st->numsuccess.v;
#endif
// calc checksum
memcpy(&hashsrc[checksumstrlen],pk,PUBLIC_LEN);
FIPS202_SHA3_256(hashsrc,sizeof(hashsrc),&pk[PUBLIC_LEN]);
// version byte
pk[PUBLIC_LEN + 2] = 0x03;
// full name
strcpy(base32_to(&sname[direndpos],pk,PUBONION_LEN),".onion");
onionready(sname,secret,pubonion.raw);
// don't reuse same seed
goto initseed;
} }
} else goto initseed;
#ifdef STATISTICS
++st->numsuccess.v;
#endif
// calc checksum
memcpy(&hashsrc[checksumstrlen],pk,PUBLIC_LEN);
FIPS202_SHA3_256(hashsrc,sizeof(hashsrc),&pk[PUBLIC_LEN]);
// version byte
pk[PUBLIC_LEN + 2] = 0x03;
// full name
strcpy(base32_to(&sname[direndpos],pk,PUBONION_LEN),".onion");
onionready(sname,secret,pubonion.raw);
// don't reuse same seed
goto initseed;
});
// next // next
ge_add(&sum, &ge_public,&ge_eightpoint); ge_add(&sum, &ge_public,&ge_eightpoint);
@ -832,6 +910,8 @@ void setworkdir(const char *wd)
if (wd[l-1] != '/') if (wd[l-1] != '/')
needslash = 1; needslash = 1;
char *s = malloc(l + needslash + 1); char *s = malloc(l + needslash + 1);
if (!s)
abort();
memcpy(s, wd, l); memcpy(s, wd, l);
if (needslash) if (needslash)
s[l++] = '/'; s[l++] = '/';