/*
 * Simple test program for regexp(3) stuff.  Knows about debugging hooks.
 *
 *	Copyright (c) 1986 by University of Toronto.
 *	Written by Henry Spencer.  Not derived from licensed software.
 *
 *	Permission is granted to anyone to use this software for any
 *	purpose on any computer system, and to redistribute it freely,
 *	subject to the following restrictions:
 *
 *	1. The author is not responsible for the consequences of use of
 *		this software, no matter how awful, even if they arise
 *		from defects in it.
 *
 *	2. The origin of this software must not be misrepresented, either
 *		by explicit claim or by omission.
 *
 *	3. Altered versions must be plainly marked as such, and must not
 *		be misrepresented as being the original software.
 *
 * Usage: try re [string [output [-]]]
 * The re is compiled and dumped, regexeced against the string, the result
 * is applied to output using regsub().  The - triggers a running narrative
 * from regexec().  Dumping and narrative don't happen unless DEBUG.
 *
 * If there are no arguments, stdin is assumed to be a stream of lines with
 * five fields:  a r.e., a string to match it against, a result code, a
 * source string for regsub, and the proper result.  Result codes are 'c'
 * for compile failure, 'y' for match success, 'n' for match failure.
 * Field separator is tab.
 */
#include <stdio.h>
#include <regexp.h>

/* build test strings in ++jrb */
char *test_input[] = {
    "abc	abc	y	&	abc",
    "abc	xbc	n	-	-",
    "abc	axc	n	-	-",
    "abc	abx	n	-	-",
    "abc	xabcy	y	&	abc",
    "abc	ababc	y	&	abc",
    "ab*c	abc	y	&	abc",
    "ab*bc	abc	y	&	abc",
    "ab*bc	abbc	y	&	abbc",
    "ab*bc	abbbbc	y	&	abbbbc",
    "ab+bc	abbc	y	&	abbc",
    "ab+bc	abc	n	-	-",
    "ab+bc	abq	n	-	-",
    "ab+bc	abbbbc	y	&	abbbbc",
    "ab?bc	abbc	y	&	abbc",
    "ab?bc	abc	y	&	abc",
    "ab?bc	abbbbc	n	-	-",
    "ab?c	abc	y	&	abc",
    "^abc$	abc	y	&	abc",
    "^abc$	abcc	n	-	-",
    "^abc	abcc	y	&	abc",
    "^abc$	aabc	n	-	-",
    "abc$	aabc	y	&	abc",
    "^	abc	y	&	",
    "$	abc	y	&	",
    "a.c	abc	y	&	abc",
    "a.c	axc	y	&	axc",
    "a.*c	axyzc	y	&	axyzc",
    "a.*c	axyzd	n	-	-",
    "a[bc]d	abc	n	-	-",
    "a[bc]d	abd	y	&	abd",
    "a[b-d]e	abd	n	-	-",
    "a[b-d]e	ace	y	&	ace",
    "a[b-d]	aac	y	&	ac",
    "a[-b]	a-	y	&	a-",
    "a[b-]	a-	y	&	a-",
    "a[b-a]	-	c	-	-",
    "a[]b	-	c	-	-",
    "a[	-	c	-	-",
    "a]	a]	y	&	a]",
    "a[]]b	a]b	y	&	a]b",
    "a[^bc]d	aed	y	&	aed",
    "a[^bc]d	abd	n	-	-",
    "a[^-b]c	adc	y	&	adc",
    "a[^-b]c	a-c	n	-	-",
    "a[^]b]c	a]c	n	-	-",
    "a[^]b]c	adc	y	&	adc",
    "ab|cd	abc	y	&	ab",
    "ab|cd	abcd	y	&	ab",
    "()ef	def	y	&-\\1	ef-",
    "()*	-	c	-	-",
    "*a	-	c	-	-",
    "^*	-	c	-	-",
    "$*	-	c	-	-",
    "(*)b	-	c	-	-",
    "$b	b	n	-	-",
    "a\\	-	c	-	-",
    "a\\(b	a(b	y	&-\\1	a(b-",
    "a\\(*b	ab	y	&	ab",
    "a\\(*b	a((b	y	&	a((b",
    "a\\\\b	a\\b	y	&	a\\b",
    "abc)	-	c	-	-",
    "(abc	-	c	-	-",
    "((a))	abc	y	&-\\1-\\2	a-a-a",
    "(a)b(c)	abc	y	&-\\1-\\2	abc-a-c",
    "a+b+c	aabbabc	y	&	abc",
    "a**	-	c	-	-",
    "a*?	-	c	-	-",
    "(a*)*	-	c	-	-",
    "(a*)+	-	c	-	-",
    "(a|)*	-	c	-	-",
    "(a*|b)*	-	c	-	-",
    "(a+|b)*	ab	y	&-\\1	ab-b",
    "(a+|b)+	ab	y	&-\\1	ab-b",
    "(a+|b)?	ab	y	&-\\1	a-a",
    "[^ab]*	cde	y	&	cde",
    "(^)*	-	c	-	-",
    "(ab|)*	-	c	-	-",
    ")(	-	c	-	-",
    "	abc	y	&	",
    "abc		n	-	-",
    "a*		y	&	",
    "([abc])*d	abbbcd	y	&-\\1	abbbcd-c",
    "([abc])*bcd	abcd	y	&-\\1	abcd-a",
    "a|b|c|d|e	e	y	&	e",
    "(a|b|c|d|e)f	ef	y	&-\\1	ef-e",
    "((a*|b))*	-	c	-	-",
    "abcd*efg	abcdefg	y	&	abcdefg",
    "ab*	xabyabbbz	y	&	ab",
    "ab*	xayabbbz	y	&	a",
    "(ab|cd)e	abcde	y	&-\\1	cde-cd",
    "[abhgefdc]ij	hij	y	&	hij",
    "^(ab|cd)e	abcde	n	x\\1y	xy",
    "(abc|)ef	abcdef	y	&-\\1	ef-",
    "(a|b)c*d	abcd	y	&-\\1	bcd-b",
    "(ab|ab*)bc	abc	y	&-\\1	abc-a",
    "a([bc]*)c*	abc	y	&-\\1	abc-bc",
    "a([bc]*)(c*d)	abcd	y	&-\\1-\\2	abcd-bc-d",
    "a([bc]+)(c*d)	abcd	y	&-\\1-\\2	abcd-bc-d",
    "a([bc]*)(c+d)	abcd	y	&-\\1-\\2	abcd-b-cd",
    "a[bcd]*dcdcde	adcdcde	y	&	adcdcde",
    "a[bcd]+dcdcde	adcdcde	n	-	-",
    "(ab|a)b*c	abc	y	&-\\1	abc-ab",
    "((a)(b)c)(d)	abcd	y	\\1-\\2-\\3-\\4	abc-a-b-d",
    "[a-zA-Z_][a-zA-Z0-9_]*	alpha	y	&	alpha",
    "^a(bc+|b[eh])g|.h$	abh	y	&-\\1	bh-",
    "(bc+d$|ef*g.|h?i(j|k))	effgz	y	&-\\1-\\2	effgz-effgz-",
    "(bc+d$|ef*g.|h?i(j|k))	ij	y	&-\\1-\\2	ij-ij-j",
    "(bc+d$|ef*g.|h?i(j|k))	effg	n	-	-",
    "(bc+d$|ef*g.|h?i(j|k))	bcdd	n	-	-",
    "(bc+d$|ef*g.|h?i(j|k))	reffgz	y	&-\\1-\\2	effgz-effgz-",
    "((((((((((a))))))))))	-	c	-	-",
    "(((((((((a)))))))))	a	y	&	a",
    "multiple words of text	uh-uh	n	-	-",
    "multiple words	multiple words, yeah	y	&	multiple words",
    "(.*)c(.*)	abcde	y	&-\\1-\\2	abcde-ab-de",
    "\\((.*), (.*)\\)	(a, b)	y	(\\2, \\1)	(b, a)",
    "abcd	abcd	y	&-\\&-\\\\&	abcd-&-\\abcd",
    "a(bc)d	abcd	y	\\1-\\\\1-\\\\\\1	bc-\\1-\\bc",
    "[ -~]*	abc	y	&	abc",
    "[ -~ -~]*	abc	y	&	abc",
    "[ -~ -~ -~]*	abc	y	&	abc",
    "[ -~ -~ -~ -~]*	abc	y	&	abc",
    "[ -~ -~ -~ -~ -~]*	abc	y	&	abc",
    "[ -~ -~ -~ -~ -~ -~]*	abc	y	&	abc",
    "[ -~ -~ -~ -~ -~ -~ -~]*	abc	y	&	abc",
  (char *)NULL
};

#ifdef ERRAVAIL
char *progname;
extern char *mkprogname();
#endif

#ifdef DEBUG
extern int regnarrate;
#endif

char buf[BUFSIZ];

int errreport = 0;		/* Report errors via errseen? */
char *errseen = NULL;		/* Error message. */
int status = 0;			/* Exit status. */

/* ARGSUSED */
int main(argc, argv)
int argc;
char *argv[];
{
	regexp *r;
	int i;

#ifdef ERRAVAIL
	progname = mkprogname(argv[0]);
#endif

	if (argc == 1) {
		multiple();
		return(status);
	}

	r = regcomp(argv[1]);
	if (r == NULL)
		error("regcomp failure", "");
#ifdef DEBUG
	regdump(r);
	if (argc > 4)
		regnarrate++;
#endif
	if (argc > 2) {
		i = regexec(r, argv[2], 1);
		printf("%d", i);
		for (i = 1; i < NSUBEXP; i++)
			if (r->startp[i] != NULL && r->endp[i] != NULL)
				printf(" \\%d", i);
		printf("\n");
	}
	if (argc > 3) {
		regsub(r, argv[3], buf);
		printf("%s\n", buf);
	}
	return(status);
}

void
regerror(s)
char *s;
{
	if (errreport)
		errseen = s;
	else
		error(s, "");
}

#ifndef ERRAVAIL
error(s1, s2)
char *s1;
char *s2;
{
	fprintf(stderr, "regexp: ");
	fprintf(stderr, s1, s2);
	fprintf(stderr, "\n");
	exit(1);
}
#endif

int lineno;

regexp badregexp;		/* Implicit init to 0. */

char rbuf[1024];
multiple()
{
	char *field[5];
	char *scan;
	int i, j;
	regexp *r;
	extern char *strchr();

	errreport = 1;
	lineno = 0;
        for(j = 0; test_input[j]; j++) {
		strcpy(rbuf, test_input[j]);
		lineno++;
		scan = rbuf;
		for (i = 0; i < 5; i++) {
			field[i] = scan;
			if (field[i] == NULL) {
				complain("bad testfile format", "");
				exit(1);
			}
			scan = strchr(scan, '\t');
			if (scan != NULL)
				*scan++ = '\0';
		}
		try(field);
	}

	/* And finish up with some internal testing... */
	lineno = 9990;
	errseen = NULL;
	if (regcomp((char *)NULL) != NULL || errseen == NULL)
		complain("regcomp(NULL) doesn't complain", "");
	lineno = 9991;
	errseen = NULL;
	if (regexec((regexp *)NULL, "foo", 1) || errseen == NULL)
		complain("regexec(NULL, ...) doesn't complain", "");
	lineno = 9992;
	r = regcomp("foo");
	if (r == NULL) {
		complain("regcomp(\"foo\") fails", "");
		return;
	}
	lineno = 9993;
	errseen = NULL;
	if (regexec(r, (char *)NULL, 1) || errseen == NULL)
		complain("regexec(..., NULL) doesn't complain", "");
	lineno = 9994;
	errseen = NULL;
	regsub((regexp *)NULL, "foo", rbuf);
	if (errseen == NULL)
		complain("regsub(NULL, ..., ...) doesn't complain", "");
	lineno = 9995;
	errseen = NULL;
	regsub(r, (char *)NULL, rbuf);
	if (errseen == NULL)
		complain("regsub(..., NULL, ...) doesn't complain", "");
	lineno = 9996;
	errseen = NULL;
	regsub(r, "foo", (char *)NULL);
	if (errseen == NULL)
		complain("regsub(..., ..., NULL) doesn't complain", "");
	lineno = 9997;
	errseen = NULL;
	if (regexec(&badregexp, "foo", 1) || errseen == NULL)
		complain("regexec(nonsense, ...) doesn't complain", "");
	lineno = 9998;
	errseen = NULL;
	regsub(&badregexp, "foo", rbuf);
	if (errseen == NULL)
		complain("regsub(nonsense, ..., ...) doesn't complain", "");
}

try(fields)
char **fields;
{
	regexp *r;
	char dbuf[BUFSIZ];

	errseen = NULL;
	r = regcomp(fields[0]);
	if (r == NULL) {
		if (*fields[2] != 'c')
			complain("regcomp failure in `%s'", fields[0]);
		return;
	}
	if (*fields[2] == 'c') {
		complain("unexpected regcomp success in `%s'", fields[0]);
		free((char *)r);
		return;
	}
	if (!regexec(r, fields[1], 1)) {
		if (*fields[2] != 'n')
			complain("regexec failure in `%s'", "");
		free((char *)r);
		return;
	}
	if (*fields[2] == 'n') {
		complain("unexpected regexec success", "");
		free((char *)r);
		return;
	}
	errseen = NULL;
	regsub(r, fields[3], dbuf);
	if (errseen != NULL) {
		complain("regsub complaint", "");
		free((char *)r);
		return;
	}
	if (strcmp(dbuf, fields[4]) != 0)
		complain("regsub result `%s' wrong", dbuf);
	free((char *)r);
}

complain(s1, s2)
char *s1;
char *s2;
{
	fprintf(stderr, "try: %d: ", lineno);
	fprintf(stderr, s1, s2);
	fprintf(stderr, " (%s)\n", (errseen != NULL) ? errseen : "");
	status = 1;
}
