Do not count the end of a line in the bigram table. Newlines are stripped
before coding anyway, and the bigram output was screwing up (and often
pessimising) the table.
This commit is contained in:
mycroft 2000-05-06 10:26:45 +00:00
parent e8509e9145
commit 73816a58f3

View File

@ -1,4 +1,4 @@
/* $NetBSD: locate.bigram.c,v 1.8 2000/03/22 21:45:02 simonb Exp $ */ /* $NetBSD: locate.bigram.c,v 1.9 2000/05/06 10:26:45 mycroft Exp $ */
/* /*
* Copyright (c) 1989, 1993 * Copyright (c) 1989, 1993
@ -46,7 +46,7 @@ __COPYRIGHT("@(#) Copyright (c) 1989, 1993\n\
#if 0 #if 0
static char sccsid[] = "@(#)locate.bigram.c 8.2 (Berkeley) 4/28/95"; static char sccsid[] = "@(#)locate.bigram.c 8.2 (Berkeley) 4/28/95";
#endif #endif
__RCSID("$NetBSD: locate.bigram.c,v 1.8 2000/03/22 21:45:02 simonb Exp $"); __RCSID("$NetBSD: locate.bigram.c,v 1.9 2000/05/06 10:26:45 mycroft Exp $");
#endif /* not lint */ #endif /* not lint */
/* /*
@ -79,16 +79,7 @@ static void
add_bigram(i1, i2) add_bigram(i1, i2)
u_char i1, i2; u_char i1, i2;
{ {
if (i1 == '\n') { if (i1 != '\n' && i2 != '\n')
bigrams[0].count++;
i1 = 0;
}
if (i2 == '\n') {
bigrams[0].count++;
i2 = i1;
i1 = 0;
}
bigrams[(i1<<8)+i2].count++; bigrams[(i1<<8)+i2].count++;
} }