568 lines
11 KiB
C
568 lines
11 KiB
C
/* $NetBSD: xstr.c,v 1.19 2004/06/06 07:09:55 christos Exp $ */
|
|
|
|
/*
|
|
* Copyright (c) 1980, 1993
|
|
* The Regents of the University of California. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. Neither the name of the University nor the names of its contributors
|
|
* may be used to endorse or promote products derived from this software
|
|
* without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*/
|
|
|
|
#include <sys/cdefs.h>
|
|
#ifndef lint
|
|
__COPYRIGHT("@(#) Copyright (c) 1980, 1993\n\
|
|
The Regents of the University of California. All rights reserved.\n");
|
|
#endif /* not lint */
|
|
|
|
#ifndef lint
|
|
#if 0
|
|
static char sccsid[] = "@(#)xstr.c 8.1 (Berkeley) 6/9/93";
|
|
#else
|
|
__RCSID("$NetBSD: xstr.c,v 1.19 2004/06/06 07:09:55 christos Exp $");
|
|
#endif
|
|
#endif /* not lint */
|
|
|
|
#include <sys/types.h>
|
|
#include <signal.h>
|
|
#include <errno.h>
|
|
#include <unistd.h>
|
|
#include <stdio.h>
|
|
#include <ctype.h>
|
|
#include <string.h>
|
|
#include <stdlib.h>
|
|
#include <err.h>
|
|
#include "pathnames.h"
|
|
|
|
/*
|
|
* xstr - extract and hash strings in a C program
|
|
*
|
|
* Bill Joy UCB
|
|
* November, 1978
|
|
*/
|
|
|
|
static off_t hashit(const char *, int);
|
|
static void onintr(int);
|
|
static off_t yankstr(char **);
|
|
static int octdigit(char);
|
|
static void inithash(void);
|
|
static int fgetNUL(char *, int, FILE *);
|
|
static int xgetc(FILE *);
|
|
static void flushsh(void);
|
|
static void found(int, off_t, const char *);
|
|
static void prstr(const char *);
|
|
static void xsdotc(void);
|
|
static char lastchr(const char *);
|
|
static int istail(const char *, const char *);
|
|
static void process(const char *);
|
|
static void usage(void);
|
|
|
|
static off_t tellpt;
|
|
static off_t mesgpt;
|
|
static char *strings = "strings";
|
|
static char *array = 0;
|
|
static int cflg;
|
|
static int vflg;
|
|
static int readstd;
|
|
static char linebuf[8192];
|
|
|
|
#define BUCKETS 128
|
|
|
|
static struct hash {
|
|
off_t hpt;
|
|
char *hstr;
|
|
struct hash *hnext;
|
|
short hnew;
|
|
} bucket[BUCKETS];
|
|
|
|
int main(int, char *[]);
|
|
|
|
int
|
|
main(int argc, char *argv[])
|
|
{
|
|
int c;
|
|
|
|
while ((c = getopt(argc, argv, "-cvl:")) != -1)
|
|
switch (c) {
|
|
case '-':
|
|
readstd++;
|
|
break;
|
|
case 'c':
|
|
cflg++;
|
|
break;
|
|
case 'v':
|
|
vflg++;
|
|
break;
|
|
case 'l':
|
|
array = optarg;
|
|
break;
|
|
default:
|
|
usage();
|
|
}
|
|
argc -= optind;
|
|
argv += optind;
|
|
|
|
if (array == 0)
|
|
array = "xstr";
|
|
|
|
if (signal(SIGINT, SIG_IGN) == SIG_DFL)
|
|
(void)signal(SIGINT, onintr);
|
|
if (cflg || (argc == 0 && !readstd))
|
|
inithash();
|
|
else {
|
|
int fd;
|
|
|
|
strings = strdup(_PATH_TMP);
|
|
fd = mkstemp(strings);
|
|
if (fd == -1)
|
|
err(1, "mkstemp failed");
|
|
close(fd);
|
|
}
|
|
while (readstd || argc > 0) {
|
|
if (freopen("x.c", "w", stdout) == NULL)
|
|
err(1, "Cannot open `%s'", "x.c");
|
|
if (!readstd && freopen(argv[0], "r", stdin) == NULL)
|
|
err(1, "Cannot open `%s'", argv[0]);
|
|
process("x.c");
|
|
if (readstd == 0)
|
|
argc--, argv++;
|
|
else
|
|
readstd = 0;
|
|
};
|
|
flushsh();
|
|
if (cflg == 0)
|
|
xsdotc();
|
|
if (strings[0] == '/')
|
|
(void)unlink(strings);
|
|
exit(0);
|
|
}
|
|
|
|
static void
|
|
process(const char *name)
|
|
{
|
|
char *cp;
|
|
int c;
|
|
int incomm = 0;
|
|
int inasm = 0;
|
|
int asmparnest = 0;
|
|
int ret;
|
|
|
|
printf("extern char\t%s[];\n", array);
|
|
for (;;) {
|
|
if (fgets(linebuf, sizeof linebuf, stdin) == NULL) {
|
|
if (ferror(stdin))
|
|
err(1, "Error reading `%s'", name);
|
|
break;
|
|
}
|
|
if (linebuf[0] == '#') {
|
|
printf("%s", linebuf);
|
|
continue;
|
|
}
|
|
for (cp = linebuf; (c = *cp++);)
|
|
switch (c) {
|
|
|
|
case '"':
|
|
if (incomm || inasm)
|
|
goto def;
|
|
if ((ret = (int) yankstr(&cp)) == -1)
|
|
goto out;
|
|
printf("(&%s[%d])", array, ret);
|
|
break;
|
|
|
|
case '\'':
|
|
if (incomm || inasm)
|
|
goto def;
|
|
putchar(c);
|
|
if (*cp)
|
|
putchar(*cp++);
|
|
break;
|
|
|
|
case '/':
|
|
if (incomm || *cp != '*')
|
|
goto def;
|
|
incomm = 1;
|
|
cp++;
|
|
printf("/*");
|
|
continue;
|
|
|
|
case '*':
|
|
if (incomm && *cp == '/') {
|
|
incomm = 0;
|
|
cp++;
|
|
printf("*/");
|
|
continue;
|
|
}
|
|
goto def;
|
|
|
|
case '(':
|
|
if (!incomm && inasm)
|
|
asmparnest++;
|
|
goto def;
|
|
|
|
case ')':
|
|
if (!incomm && inasm && !--asmparnest)
|
|
inasm = 0;
|
|
goto def;
|
|
|
|
case '_':
|
|
if (incomm || inasm)
|
|
goto def;
|
|
if (!strncmp(cp, "_asm", 4)) {
|
|
cp += 4;
|
|
printf("__asm");
|
|
if (!strncmp(cp, "__", 2)) {
|
|
cp += 2;
|
|
printf("__");
|
|
}
|
|
if (isalnum((unsigned char)*cp) ||
|
|
*cp == '_')
|
|
goto def;
|
|
asmparnest = 0;
|
|
inasm = 1;
|
|
} else
|
|
goto def;
|
|
break;
|
|
def:
|
|
default:
|
|
putchar(c);
|
|
break;
|
|
}
|
|
}
|
|
out:
|
|
if (ferror(stdout)) {
|
|
warn("Error reading `%s'", "x.c");
|
|
onintr(1);
|
|
}
|
|
}
|
|
|
|
static off_t
|
|
yankstr(char **cpp)
|
|
{
|
|
char *cp = *cpp;
|
|
int c, ch;
|
|
char *dbuf, *dp, *edp;
|
|
char *tp;
|
|
off_t hash;
|
|
size_t bsiz = BUFSIZ;
|
|
|
|
if ((dp = dbuf = malloc(bsiz)) == NULL)
|
|
err(1, "malloc");
|
|
edp = dbuf + bsiz;
|
|
|
|
while ((c = *cp++) != '\0') {
|
|
switch (c) {
|
|
|
|
case '"':
|
|
/* Look for a concatenated string */
|
|
for (;;) {
|
|
while (isspace((unsigned char)*cp))
|
|
cp++;
|
|
if (*cp == '\0') {
|
|
if (fgets(linebuf,
|
|
sizeof linebuf, stdin) == NULL) {
|
|
if (ferror(stdin))
|
|
err(1,
|
|
"Error reading `x.c'");
|
|
goto out;
|
|
}
|
|
cp = linebuf;
|
|
} else {
|
|
if (*cp == '"') {
|
|
cp++;
|
|
if (*cp == '"') {
|
|
cp++;
|
|
continue;
|
|
} else {
|
|
c = *cp++;
|
|
goto gotc;
|
|
}
|
|
} else {
|
|
cp++;
|
|
goto out;
|
|
}
|
|
}
|
|
}
|
|
/*NOTREACHED*/
|
|
case '\\':
|
|
c = *cp++;
|
|
if (c == 0)
|
|
break;
|
|
if (c == '\n') {
|
|
if (fgets(linebuf, sizeof linebuf, stdin)
|
|
== NULL) {
|
|
if (ferror(stdin))
|
|
err(1, "Error reading `x.c'");
|
|
return(-1);
|
|
}
|
|
cp = linebuf;
|
|
continue;
|
|
}
|
|
for (tp = "b\bt\tr\rn\nf\f\\\\\"\""; (ch = *tp++); tp++)
|
|
if (c == ch) {
|
|
c = *tp;
|
|
goto gotc;
|
|
}
|
|
if (!octdigit(c)) {
|
|
*dp++ = '\\';
|
|
break;
|
|
}
|
|
c -= '0';
|
|
if (!octdigit(*cp))
|
|
break;
|
|
c <<= 3, c += *cp++ - '0';
|
|
if (!octdigit(*cp))
|
|
break;
|
|
c <<= 3, c += *cp++ - '0';
|
|
break;
|
|
}
|
|
gotc:
|
|
if (dp >= edp - 1) {
|
|
char *nbuf;
|
|
bsiz += BUFSIZ;
|
|
if ((nbuf = realloc(dbuf, bsiz)) == NULL) {
|
|
free(dbuf);
|
|
err(1, "realloc");
|
|
}
|
|
dp = nbuf + (dp - dbuf);
|
|
edp = nbuf + bsiz;
|
|
dbuf = nbuf;
|
|
}
|
|
*dp++ = c;
|
|
}
|
|
out:
|
|
*cpp = --cp;
|
|
*dp = '\0';
|
|
hash = hashit(dbuf, 1);
|
|
free(dbuf);
|
|
return hash;
|
|
}
|
|
|
|
static int
|
|
octdigit(c)
|
|
char c;
|
|
{
|
|
|
|
return (isdigit((unsigned char)c) && c != '8' && c != '9');
|
|
}
|
|
|
|
static void
|
|
inithash(void)
|
|
{
|
|
char buf[BUFSIZ];
|
|
FILE *mesgread = fopen(strings, "r");
|
|
|
|
if (mesgread == NULL)
|
|
return;
|
|
for (;;) {
|
|
mesgpt = tellpt;
|
|
if (fgetNUL(buf, sizeof buf, mesgread) == 0)
|
|
break;
|
|
(void)hashit(buf, 0);
|
|
}
|
|
(void)fclose(mesgread);
|
|
}
|
|
|
|
static int
|
|
fgetNUL(char *obuf, int rmdr, FILE *file)
|
|
{
|
|
int c;
|
|
char *buf = obuf;
|
|
|
|
while (--rmdr > 0 && (c = xgetc(file) != 0 && c != EOF))
|
|
*buf++ = c;
|
|
*buf++ = 0;
|
|
return (feof(file) || ferror(file)) ? 0 : 1;
|
|
}
|
|
|
|
static int
|
|
xgetc(FILE *file)
|
|
{
|
|
|
|
tellpt++;
|
|
return getc(file);
|
|
}
|
|
|
|
|
|
static off_t
|
|
hashit(const char *str, int new)
|
|
{
|
|
int i;
|
|
struct hash *hp, *hp0;
|
|
|
|
hp = hp0 = &bucket[lastchr(str) & 0177];
|
|
while (hp->hnext) {
|
|
hp = hp->hnext;
|
|
i = istail(str, hp->hstr);
|
|
if (i >= 0)
|
|
return (hp->hpt + i);
|
|
}
|
|
if ((hp = calloc(1, sizeof (*hp))) == NULL)
|
|
err(1, NULL);
|
|
hp->hpt = mesgpt;
|
|
if ((hp->hstr = strdup(str)) == NULL)
|
|
err(1, NULL);
|
|
mesgpt += strlen(hp->hstr) + 1;
|
|
hp->hnext = hp0->hnext;
|
|
hp->hnew = new;
|
|
hp0->hnext = hp;
|
|
return (hp->hpt);
|
|
}
|
|
|
|
static void
|
|
flushsh(void)
|
|
{
|
|
int i;
|
|
struct hash *hp;
|
|
FILE *mesgwrit;
|
|
int old = 0, new = 0;
|
|
|
|
for (i = 0; i < BUCKETS; i++)
|
|
for (hp = bucket[i].hnext; hp != NULL; hp = hp->hnext)
|
|
if (hp->hnew)
|
|
new++;
|
|
else
|
|
old++;
|
|
if (new == 0 && old != 0)
|
|
return;
|
|
mesgwrit = fopen(strings, old ? "r+" : "w");
|
|
if (mesgwrit == NULL)
|
|
err(1, "Cannot open `%s'", strings);
|
|
for (i = 0; i < BUCKETS; i++)
|
|
for (hp = bucket[i].hnext; hp != NULL; hp = hp->hnext) {
|
|
found(hp->hnew, hp->hpt, hp->hstr);
|
|
if (hp->hnew) {
|
|
(void)fseek(mesgwrit, hp->hpt, 0);
|
|
(void)fwrite(hp->hstr, strlen(hp->hstr) + 1, 1,
|
|
mesgwrit);
|
|
if (ferror(mesgwrit))
|
|
err(1, "Error writing `%s'", strings);
|
|
}
|
|
}
|
|
if (fclose(mesgwrit) == EOF)
|
|
err(1, "Error closing `%s'", strings);
|
|
}
|
|
|
|
static void
|
|
found(int new, off_t off, const char *str)
|
|
{
|
|
if (vflg == 0)
|
|
return;
|
|
if (!new)
|
|
(void)fprintf(stderr, "found at %d:", (int) off);
|
|
else
|
|
(void)fprintf(stderr, "new at %d:", (int) off);
|
|
prstr(str);
|
|
(void)fprintf(stderr, "\n");
|
|
}
|
|
|
|
static void
|
|
prstr(const char *cp)
|
|
{
|
|
int c;
|
|
|
|
while ((c = (*cp++ & 0377)) != '\0')
|
|
if (c < ' ')
|
|
(void)fprintf(stderr, "^%c", c + '`');
|
|
else if (c == 0177)
|
|
(void)fprintf(stderr, "^?");
|
|
else if (c > 0200)
|
|
(void)fprintf(stderr, "\\%03o", c);
|
|
else
|
|
(void)fprintf(stderr, "%c", c);
|
|
}
|
|
|
|
static void
|
|
xsdotc(void)
|
|
{
|
|
FILE *strf = fopen(strings, "r");
|
|
FILE *xdotcf;
|
|
|
|
if (strf == NULL)
|
|
err(1, "Cannot open `%s'", strings);
|
|
xdotcf = fopen("xs.c", "w");
|
|
if (xdotcf == NULL)
|
|
err(1, "Cannot open `%s'", "xs.c");
|
|
(void)fprintf(xdotcf, "char\t%s[] = {\n", array);
|
|
for (;;) {
|
|
int i, c;
|
|
|
|
for (i = 0; i < 8; i++) {
|
|
c = getc(strf);
|
|
if (ferror(strf)) {
|
|
warn("Error reading `%s'", strings);
|
|
onintr(1);
|
|
}
|
|
if (feof(strf)) {
|
|
(void)fprintf(xdotcf, "\n");
|
|
goto out;
|
|
}
|
|
(void)fprintf(xdotcf, "0x%02x,", c);
|
|
}
|
|
(void)fprintf(xdotcf, "\n");
|
|
}
|
|
out:
|
|
(void)fprintf(xdotcf, "};\n");
|
|
(void)fclose(xdotcf);
|
|
(void)fclose(strf);
|
|
}
|
|
|
|
static char
|
|
lastchr(const char *cp)
|
|
{
|
|
|
|
while (cp[0] && cp[1])
|
|
cp++;
|
|
return (*cp);
|
|
}
|
|
|
|
static int
|
|
istail(const char *str, const char *of)
|
|
{
|
|
int d = strlen(of) - strlen(str);
|
|
|
|
if (d < 0 || strcmp(&of[d], str) != 0)
|
|
return (-1);
|
|
return (d);
|
|
}
|
|
|
|
static void
|
|
onintr(int dummy)
|
|
{
|
|
|
|
(void)signal(SIGINT, SIG_IGN);
|
|
if (strings[0] == '/')
|
|
(void)unlink(strings);
|
|
(void)unlink("x.c");
|
|
(void)unlink("xs.c");
|
|
exit(dummy);
|
|
}
|
|
|
|
static void
|
|
usage(void)
|
|
{
|
|
|
|
(void)fprintf(stderr, "usage: %s [-vc] [-l array] [-] [<name> ...]\n",
|
|
getprogname());
|
|
exit(1);
|
|
}
|