Skip to content

Commit d265b3c

Browse files
committed
Wordlist, rules: Drop the dupe check against the previous word
This check dates back to 1990s when our primary target was descrypt with its length truncation, its computation was much slower, and we didn't have the generic dupe suppressor. In the suppressor, a word matching the previous one would be an L1 cache hit, so we don't gain much by pre-checking for that special case. And if the suppressor is disabled, that's probably because we don't want any overhead like that. Besides, this check didn't behave correctly along with an external filter() possibly modifying the word (a bug that also dates back to 1990s). OTOH, we do not currently support the suppressor on top of stacked rules (we do before stacked rules), so we do lose a bit of functionality with this change.
1 parent e1ae810 commit d265b3c

File tree

5 files changed

+28
-92
lines changed

5 files changed

+28
-92
lines changed

src/pp.c

+2-8
Original file line numberDiff line numberDiff line change
@@ -1192,11 +1192,6 @@ void do_prince_crack(struct db_main *db, const char *wordlist, int rules)
11921192
setmode (fileno (stdout), O_BINARY);
11931193
#endif
11941194
#else
1195-
union {
1196-
char buffer[LINE_BUFFER_SIZE];
1197-
ARCH_WORD dummy;
1198-
} aligned;
1199-
char *last = aligned.buffer;
12001195
int loopback = (options.flags & FLG_PRINCE_LOOPBACK) ? 1 : 0;
12011196
int mask_mult = MAX(1, mask_num_qw);
12021197
int our_fmt_len = (db->format->params.plaintext_length + ((mask_mult - 1) * mask_add_len)) / mask_mult - mask_add_len;
@@ -1371,7 +1366,7 @@ void do_prince_crack(struct db_main *db, const char *wordlist, int rules)
13711366
do {
13721367
char *rule;
13731368

1374-
if ((rule = rules_reject(prerule, -1, last, db)))
1369+
if ((rule = rules_reject(prerule, -1, db)))
13751370
{
13761371
list_add(rule_list, rule);
13771372
active_rules++;
@@ -2334,8 +2329,7 @@ void do_prince_crack(struct db_main *db, const char *wordlist, int rules)
23342329
do {
23352330
char *word;
23362331

2337-
if ((word = rules_apply(pw_buf, rule->data, -1, last))) {
2338-
last = word;
2332+
if ((word = rules_apply(pw_buf, rule->data, -1))) {
23392333
#if HAVE_REXGEN
23402334
if (regex) {
23412335
if ((jtr_done = do_regex_hybrid_crack(db, regex, word,

src/rules.c

+12-47
Original file line numberDiff line numberDiff line change
@@ -107,12 +107,10 @@ static struct {
107107
*/
108108
int pass;
109109
/*
110-
* Some rule commands may temporarily double the length, and we skip a few
111-
* machine words to avoid cache bank conflicts when copying data between the
112-
* buffers. We need three buffers because some rule commands require separate
113-
* input and output buffers and we also need a buffer either for leaving the
114-
* previous mangled word intact for a subsequent comparison (in wordlist mode)
115-
* or for switching between two input words (in "single crack" mode).
110+
* Some rule commands may temporarily double the length.
111+
* We need three buffers because some rule commands require separate input and
112+
* output buffers and we also need a buffer for switching between two input
113+
* words in "single crack" mode.
116114
* rules_apply() tries to minimize data copying, and thus it may return a
117115
* pointer to any of the three buffers.
118116
*
@@ -576,7 +574,7 @@ int rules_init_stack(char *ruleset, rule_stack *stack_ctx,
576574
do {
577575
rule_number++;
578576

579-
if ((rule = rules_reject(prerule, -1, NULL, db))) {
577+
if ((rule = rules_reject(prerule, -1, db))) {
580578
list_add(stack_ctx->stack_rule, rule);
581579
active_rules++;
582580

@@ -642,7 +640,7 @@ void rules_init(struct db_main *db, int max_length)
642640
rules_stacked_after = (options.flags & (FLG_RULES_CHK | FLG_SINGLE_CHK | FLG_BATCH_CHK)) && (options.flags & FLG_RULES_STACK_CHK);
643641
}
644642

645-
char *rules_reject(char *rule, int split, char *last, struct db_main *db)
643+
char *rules_reject(char *rule, int split, struct db_main *db)
646644
{
647645
static char out_rule[RULE_BUFFER_SIZE];
648646

@@ -748,15 +746,15 @@ char *rules_reject(char *rule, int split, char *last, struct db_main *db)
748746
accept:
749747
rules_pass--;
750748
strnzcpy(out_rule, rule - 1, sizeof(out_rule));
751-
rules_apply(safe_null_string, out_rule, split, last);
749+
rules_apply(safe_null_string, out_rule, split);
752750
rules_pass++;
753751

754752
return out_rule;
755753
}
756754

757755
#define STACK_MAXLEN (rules_stacked_after ? RULE_WORD_SIZE : rules_max_length)
758756

759-
char *rules_apply(char *word_in, char *rule, int split, char *last)
757+
char *rules_apply(char *word_in, char *rule, int split)
760758
{
761759
union {
762760
char aligned[PLAINTEXT_BUFFER_SIZE];
@@ -776,8 +774,6 @@ char *rules_apply(char *word_in, char *rule, int split, char *last)
776774
memory = word = word_in;
777775

778776
in = buffer[0][STAGE];
779-
if (in == last)
780-
in = buffer[2][STAGE];
781777

782778
length = 0;
783779
while (length < RULE_WORD_SIZE) {
@@ -797,8 +793,6 @@ char *rules_apply(char *word_in, char *rule, int split, char *last)
797793
REJECT
798794

799795
alt = buffer[1][STAGE];
800-
if (alt == last)
801-
alt = buffer[2][STAGE];
802796

803797
/*
804798
* This assumes that RULE_WORD_SIZE is small enough that length can't reach or
@@ -1771,22 +1765,6 @@ char *rules_apply(char *word_in, char *rule, int split, char *last)
17711765
length = strlen(in);
17721766
}
17731767

1774-
if (last) {
1775-
if (length > STACK_MAXLEN)
1776-
length = STACK_MAXLEN;
1777-
if (length >= ARCH_SIZE - 1) {
1778-
if (*(ARCH_WORD *)in != *(ARCH_WORD *)last)
1779-
return in;
1780-
if (strcmp(&in[ARCH_SIZE - 1], &last[ARCH_SIZE - 1]))
1781-
return in;
1782-
return NULL;
1783-
}
1784-
if (last[length])
1785-
return in;
1786-
if (memcmp(in, last, length))
1787-
return in;
1788-
return NULL;
1789-
}
17901768
return in;
17911769

17921770
out_which:
@@ -1849,11 +1827,6 @@ int rules_advance_stack(rule_stack *ctx, int quiet)
18491827
*/
18501828
char *rules_process_stack(char *key, rule_stack *ctx)
18511829
{
1852-
static union {
1853-
char buf[LINE_BUFFER_SIZE];
1854-
ARCH_WORD dummy;
1855-
} aligned;
1856-
static char *last = aligned.buf;
18571830
char *word;
18581831

18591832
if (!ctx->rule) {
@@ -1865,8 +1838,7 @@ char *rules_process_stack(char *key, rule_stack *ctx)
18651838

18661839
rules_stacked_after = 0;
18671840

1868-
if ((word = rules_apply(key, ctx->rule->data, -1, last)))
1869-
last = word;
1841+
word = rules_apply(key, ctx->rule->data, -1);
18701842

18711843
rules_stacked_after = !!(options.flags & (FLG_RULES_CHK | FLG_SINGLE_CHK | FLG_BATCH_CHK));
18721844

@@ -1878,11 +1850,6 @@ char *rules_process_stack(char *key, rule_stack *ctx)
18781850
*/
18791851
char *rules_process_stack_all(char *key, rule_stack *ctx)
18801852
{
1881-
static union {
1882-
char buf[LINE_BUFFER_SIZE];
1883-
ARCH_WORD dummy;
1884-
} aligned;
1885-
static char *last = aligned.buf;
18861853
char *word;
18871854

18881855
if (!ctx->rule) {
@@ -1896,10 +1863,8 @@ char *rules_process_stack_all(char *key, rule_stack *ctx)
18961863
rules_stacked_after = 0;
18971864

18981865
while (ctx->rule) {
1899-
if ((word = rules_apply(key, ctx->rule->data, -1, last))) {
1900-
last = word;
1866+
if ((word = rules_apply(key, ctx->rule->data, -1)))
19011867
return word;
1902-
} else
19031868
if ((ctx->rule = ctx->rule->next)) {
19041869
rules_stacked_number++;
19051870
if (!stack_rules_mute)
@@ -1943,7 +1908,7 @@ static int rules_check(struct rpp_context *start, int split)
19431908

19441909
rules_pass = -1; /* rules_reject() will turn this into -2 */
19451910
while ((rule = rpp_next(&ctx))) {
1946-
rules_reject(rule, split, NULL, NULL);
1911+
rules_reject(rule, split, NULL);
19471912
if (rules_errno) break;
19481913

19491914
if (ctx.input) rules_line = ctx.input->number;
@@ -1981,7 +1946,7 @@ static void rules_load_normalized_list(struct cfg_line *pLine)
19811946
/*
19821947
* this will 'reduce' the rule by stripping no-op's.
19831948
*/
1984-
char *rule = rules_reject(pLine->data, -1, NULL, NULL);
1949+
char *rule = rules_reject(pLine->data, -1, NULL);
19851950
if (rule) {
19861951
rules_normalize_add_line(rule, pLine->id);
19871952
++rules_tmp_dup_removal_cnt;

src/rules.h

+2-10
Original file line numberDiff line numberDiff line change
@@ -60,11 +60,8 @@ extern void rules_init(struct db_main *db, int max_length);
6060
*
6161
* split == 0 "single crack" mode rules allowed
6262
* split < 0 "single crack" mode rules are invalid
63-
*
64-
* last may specify which internal buffer must not be touched.
6563
*/
66-
extern char *rules_reject(char *rule, int split, char *last,
67-
struct db_main *db);
64+
extern char *rules_reject(char *rule, int split, struct db_main *db);
6865

6966
/*
7067
* Applies rule to a word. Returns the updated word, or NULL if rejected or
@@ -73,13 +70,8 @@ extern char *rules_reject(char *rule, int split, char *last,
7370
* split > 0 "single crack" mode, split is the second word's position
7471
* split == 0 "single crack" mode, only one word
7572
* split < 0 other cracking modes, "single crack" mode rules are invalid
76-
*
77-
* If last is non-NULL, it should be the previous mangled word and it is
78-
* assumed to be properly aligned for ARCH_WORD accesses (pointers returned by
79-
* rules_apply() are properly aligned). If the new mangled word matches the
80-
* previous one, it will be rejected (rules_apply() will return NULL).
8173
*/
82-
extern char *rules_apply(char *word, char *rule, int split, char *last);
74+
extern char *rules_apply(char *word, char *rule, int split);
8375

8476
/*
8577
* Similar to rules_check(), but displays a message and does not return on

src/single.c

+4-4
Original file line numberDiff line numberDiff line change
@@ -674,7 +674,7 @@ static int single_process_pw(struct db_salt *salt, struct db_password *pw,
674674
do {
675675
if (first == global_head)
676676
first_global = 1;
677-
if ((key = rules_apply(first->data, rule, 0, NULL)))
677+
if ((key = rules_apply(first->data, rule, 0)))
678678
if (ext_filter(key))
679679
if (single_add_key(salt, key, 0))
680680
return 1;
@@ -701,7 +701,7 @@ static int single_process_pw(struct db_salt *salt, struct db_password *pw,
701701
strnzcpy(pair, first->data, RULE_WORD_SIZE);
702702
strnzcat(pair, second->data, RULE_WORD_SIZE);
703703

704-
if ((key = rules_apply(pair, rule, split, NULL)))
704+
if ((key = rules_apply(pair, rule, split)))
705705
if (ext_filter(key))
706706
if (single_add_key(salt, key, 0))
707707
return 1;
@@ -716,7 +716,7 @@ static int single_process_pw(struct db_salt *salt, struct db_password *pw,
716716
pair[1] = 0;
717717
strnzcat(pair, second->data, RULE_WORD_SIZE);
718718

719-
if ((key = rules_apply(pair, rule, 1, NULL)))
719+
if ((key = rules_apply(pair, rule, 1)))
720720
if (ext_filter(key))
721721
if (single_add_key(salt, key, 0))
722722
return 1;
@@ -817,7 +817,7 @@ static void single_run(void)
817817
}
818818
}
819819

820-
if (!(rule = rules_reject(prerule, 0, NULL, single_db))) {
820+
if (!(rule = rules_reject(prerule, 0, single_db))) {
821821
rule_number++;
822822
if (options.verbosity >= VERB_DEFAULT &&
823823
!rules_mute &&

src/wordlist.c

+8-23
Original file line numberDiff line numberDiff line change
@@ -303,7 +303,7 @@ static double get_progress(void)
303303
(rule_count * size * mask_mult));
304304
}
305305

306-
static char *dummy_rules_apply(char *word, char *rule, int split, char *last)
306+
static char *dummy_rules_apply(char *word, char *rule, int split)
307307
{
308308
return word;
309309
}
@@ -459,18 +459,17 @@ static MAYBE_INLINE int wbuf_unique(char *line)
459459
void do_wordlist_crack(struct db_main *db, const char *name, int rules)
460460
{
461461
union {
462-
char buffer[2][LINE_BUFFER_SIZE + CACHE_BANK_SHIFT];
462+
char buffer[LINE_BUFFER_SIZE];
463463
#if MGETL_HAS_SIMD
464464
vtype dummy;
465465
#else
466466
ARCH_WORD dummy;
467467
#endif
468468
} aligned;
469-
char *line = aligned.buffer[0];
470-
char *last = aligned.buffer[1];
469+
char *line = aligned.buffer;
471470
struct rpp_context ctx;
472471
char *prerule="", *rule="", *word="";
473-
char *(*apply)(char *word, char *rule, int split, char *last) = NULL;
472+
char *(*apply)(char *word, char *rule, int split) = NULL;
474473
int dist_switch=0;
475474
uint64_t my_words=0, their_words=0, my_words_left=0;
476475
int64_t i, file_len = 0;
@@ -1085,11 +1084,6 @@ void do_wordlist_crack(struct db_main *db, const char *name, int rules)
10851084
if (rules)
10861085
prerule = rpp_next(&ctx);
10871086

1088-
/* A string that can't be produced by fgetl(). */
1089-
last = aligned.buffer[1];
1090-
last[0] = '\n';
1091-
last[1] = 0;
1092-
10931087
dist_rules = 0;
10941088
dist_switch = rule_count; /* never */
10951089
my_words = ~0UL; /* all */
@@ -1151,7 +1145,7 @@ void do_wordlist_crack(struct db_main *db, const char *name, int rules)
11511145
for_node > options.node_max)
11521146
goto next_rule;
11531147
}
1154-
if ((rule = rules_reject(prerule, -1, last, db))) {
1148+
if ((rule = rules_reject(prerule, -1, db))) {
11551149
if (strcmp(prerule, rule)) {
11561150
if (!rules_mute)
11571151
log_event("- Rule #%d: '%.100s'"
@@ -1186,8 +1180,7 @@ void do_wordlist_crack(struct db_main *db, const char *name, int rules)
11861180
}
11871181
}
11881182
loop_line_no++;
1189-
if ((word = apply(joined->data, rule, -1, last))) {
1190-
last = word;
1183+
if ((word = apply(joined->data, rule, -1))) {
11911184
#if HAVE_REXGEN
11921185
if (regex) {
11931186
if (do_regex_hybrid_crack(db, regex,
@@ -1255,8 +1248,7 @@ void do_wordlist_crack(struct db_main *db, const char *name, int rules)
12551248
#endif
12561249
line_number++;
12571250

1258-
if ((word = apply(line, rule, -1, last))) {
1259-
last = word;
1251+
if ((word = apply(line, rule, -1))) {
12601252
#if HAVE_REXGEN
12611253
if (regex) {
12621254
if (do_regex_hybrid_crack(db, regex,
@@ -1326,16 +1318,9 @@ void do_wordlist_crack(struct db_main *db, const char *name, int rules)
13261318
goto next_word;
13271319
}
13281320
line[length] = 0;
1329-
1330-
if (!strcmp(line, last))
1331-
goto next_word;
13321321
}
13331322

1334-
if ((word = apply(line, rule, -1, last))) {
1335-
if (rules)
1336-
last = word;
1337-
else
1338-
strcpy(last, word);
1323+
if ((word = apply(line, rule, -1))) {
13391324
#if HAVE_REXGEN
13401325
if (regex) {
13411326
if (do_regex_hybrid_crack(

0 commit comments

Comments
 (0)