usr.bin/make/str.c

1590Srgrimes/*-
1590Srgrimes * Copyright (c) 1988, 1989, 1990, 1993
1590Srgrimes *	The Regents of the University of California.  All rights reserved.
1590Srgrimes * Copyright (c) 1989 by Berkeley Softworks
1590Srgrimes * All rights reserved.
1590Srgrimes *
1590Srgrimes * This code is derived from software contributed to Berkeley by
1590Srgrimes * Adam de Boor.
1590Srgrimes *
1590Srgrimes * Redistribution and use in source and binary forms, with or without
1590Srgrimes * modification, are permitted provided that the following conditions
1590Srgrimes * are met:
1590Srgrimes * 1. Redistributions of source code must retain the above copyright
1590Srgrimes *    notice, this list of conditions and the following disclaimer.
1590Srgrimes * 2. Redistributions in binary form must reproduce the above copyright
1590Srgrimes *    notice, this list of conditions and the following disclaimer in the
1590Srgrimes *    documentation and/or other materials provided with the distribution.
1590Srgrimes * 3. All advertising materials mentioning features or use of this software
1590Srgrimes *    must display the following acknowledgement:
1590Srgrimes *	This product includes software developed by the University of
1590Srgrimes *	California, Berkeley and its contributors.
1590Srgrimes * 4. Neither the name of the University nor the names of its contributors
1590Srgrimes *    may be used to endorse or promote products derived from this software
1590Srgrimes *    without specific prior written permission.
1590Srgrimes *
1590Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
1590Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1590Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
1590Srgrimes * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
1590Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
1590Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
1590Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
1590Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
1590Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
1590Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
1590Srgrimes * SUCH DAMAGE.
62833Swsanchez *
62833Swsanchez * @(#)str.c	5.8 (Berkeley) 6/1/90
1590Srgrimes */
1590Srgrimes
62833Swsanchez#include <sys/cdefs.h>
94587Sobrien__FBSDID("$FreeBSD: head/usr.bin/make/str.c 104696 2002-10-09 03:42:10Z jmallett $");
1590Srgrimes
1590Srgrimes#include "make.h"
1590Srgrimes
/* Word vector handed out by brk_string(); slot 0 is filled in by str_init(). */
static char **argv;
/* Scratch storage holding the NUL-separated words that argv[1..] point into. */
static char *buffer;
/* Number of word slots allocated in argv, not counting the NULL terminator. */
static int argmax;
/* Current size of buffer, in bytes. */
static int curlen;
5814Sjkh
5814Sjkh/*
5814Sjkh * str_init --
5814Sjkh *	Initialize the strings package
5814Sjkh *
5814Sjkh */
5814Sjkhvoid
104696Sjmallettstr_init(void)
5814Sjkh{
5814Sjkh    char *p1;
18730Ssteve    argv = (char **)emalloc(((argmax = 50) + 1) * sizeof(char *));
5814Sjkh    argv[0] = Var_Value(".MAKE", VAR_GLOBAL, &p1);
5814Sjkh}
5814Sjkh
5814Sjkh
5814Sjkh/*
5814Sjkh * str_end --
5814Sjkh *	Cleanup the strings package
5814Sjkh *
5814Sjkh */
5814Sjkhvoid
104696Sjmallettstr_end(void)
5814Sjkh{
9254Sache    if (argv) {
9254Sache	if (argv[0])
9254Sache	    free(argv[0]);
69531Swill	free(argv);
9254Sache    }
5814Sjkh    if (buffer)
5814Sjkh	free(buffer);
5814Sjkh}
5814Sjkh
1590Srgrimes/*-
1590Srgrimes * str_concat --
1590Srgrimes *	concatenate the two strings, inserting a space or slash between them,
1590Srgrimes *	freeing them if requested.
1590Srgrimes *
1590Srgrimes * returns --
1590Srgrimes *	the resulting string in allocated space.
1590Srgrimes */
1590Srgrimeschar *
104696Sjmallettstr_concat(char *s1, char *s2, int flags)
1590Srgrimes{
94584Sobrien	int len1, len2;
94584Sobrien	char *result;
1590Srgrimes
1590Srgrimes	/* get the length of both strings */
94638Sobrien	len1 = strlen(s1);
94638Sobrien	len2 = strlen(s2);
1590Srgrimes
1590Srgrimes	/* allocate length plus separator plus EOS */
1590Srgrimes	result = emalloc((u_int)(len1 + len2 + 2));
1590Srgrimes
1590Srgrimes	/* copy first string into place */
94638Sobrien	memcpy(result, s1, len1);
1590Srgrimes
1590Srgrimes	/* add separator character */
94638Sobrien	if (flags & STR_ADDSPACE) {
94638Sobrien		result[len1] = ' ';
94638Sobrien		++len1;
94638Sobrien	} else if (flags & STR_ADDSLASH) {
94638Sobrien		result[len1] = '/';
94638Sobrien		++len1;
1590Srgrimes	}
1590Srgrimes
94638Sobrien	/* copy second string plus EOS into place */
94638Sobrien	memcpy(result + len1, s2, len2 + 1);
1590Srgrimes
1590Srgrimes	/* free original strings */
1590Srgrimes	if (flags & STR_DOFREE) {
97123Sjmallett		(void)efree(s1);
97123Sjmallett		(void)efree(s2);
1590Srgrimes	}
1590Srgrimes	return(result);
1590Srgrimes}
1590Srgrimes
1590Srgrimes/*-
1590Srgrimes * brk_string --
1590Srgrimes *	Fracture a string into an array of words (as delineated by tabs or
1590Srgrimes *	spaces) taking quotation marks into account.  Leading tabs/spaces
1590Srgrimes *	are ignored.
1590Srgrimes *
1590Srgrimes * returns --
1590Srgrimes *	Pointer to the array of pointers to the words.  To make life easier,
1590Srgrimes *	the first word is always the value of the .MAKE variable.
1590Srgrimes */
1590Srgrimeschar **
104696Sjmallettbrk_string(char *str, int *store_argc, Boolean expand)
1590Srgrimes{
94584Sobrien	int argc, ch;
94584Sobrien	char inquote, *p, *start, *t;
1590Srgrimes	int len;
1590Srgrimes
1590Srgrimes	/* skip leading space chars. */
1590Srgrimes	for (; *str == ' ' || *str == '\t'; ++str)
1590Srgrimes		continue;
1590Srgrimes
1590Srgrimes	/* allocate room for a copy of the string */
5814Sjkh	if ((len = strlen(str) + 1) > curlen) {
5814Sjkh		if (buffer)
5814Sjkh		    free(buffer);
5814Sjkh		buffer = emalloc(curlen = len);
5814Sjkh	}
1590Srgrimes
1590Srgrimes	/*
1590Srgrimes	 * copy the string; at the same time, parse backslashes,
1590Srgrimes	 * quotes and build the argument list.
1590Srgrimes	 */
1590Srgrimes	argc = 1;
1590Srgrimes	inquote = '\0';
5814Sjkh	for (p = str, start = t = buffer;; ++p) {
1590Srgrimes		switch(ch = *p) {
1590Srgrimes		case '"':
1590Srgrimes		case '\'':
49938Shoek			if (inquote) {
1590Srgrimes				if (inquote == ch)
1590Srgrimes					inquote = '\0';
1590Srgrimes				else
1590Srgrimes					break;
49938Shoek			} else {
1590Srgrimes				inquote = (char) ch;
5814Sjkh				/* Don't miss "" or '' */
5814Sjkh				if (start == NULL && p[1] == inquote) {
5814Sjkh					start = t + 1;
5814Sjkh					break;
5814Sjkh				}
2266Ssef			}
5814Sjkh			if (!expand) {
5814Sjkh				if (!start)
5814Sjkh					start = t;
5814Sjkh				*t++ = ch;
5814Sjkh			}
5814Sjkh			continue;
1590Srgrimes		case ' ':
1590Srgrimes		case '\t':
5814Sjkh		case '\n':
1590Srgrimes			if (inquote)
1590Srgrimes				break;
1590Srgrimes			if (!start)
1590Srgrimes				continue;
1590Srgrimes			/* FALLTHROUGH */
1590Srgrimes		case '\0':
1590Srgrimes			/*
1590Srgrimes			 * end of a token -- make sure there's enough argv
1590Srgrimes			 * space and save off a pointer.
1590Srgrimes			 */
5814Sjkh			if (!start)
5814Sjkh			    goto done;
5814Sjkh
1590Srgrimes			*t++ = '\0';
1590Srgrimes			if (argc == argmax) {
1590Srgrimes				argmax *= 2;		/* ramp up fast */
18730Ssteve				argv = (char **)erealloc(argv,
18730Ssteve				    (argmax + 1) * sizeof(char *));
1590Srgrimes			}
1590Srgrimes			argv[argc++] = start;
1590Srgrimes			start = (char *)NULL;
1590Srgrimes			if (ch == '\n' || ch == '\0')
1590Srgrimes				goto done;
1590Srgrimes			continue;
1590Srgrimes		case '\\':
5814Sjkh			if (!expand) {
5814Sjkh				if (!start)
5814Sjkh					start = t;
5814Sjkh				*t++ = '\\';
5814Sjkh				ch = *++p;
5814Sjkh				break;
5814Sjkh			}
8874Srgrimes
1590Srgrimes			switch (ch = *++p) {
1590Srgrimes			case '\0':
1590Srgrimes			case '\n':
1590Srgrimes				/* hmmm; fix it up as best we can */
1590Srgrimes				ch = '\\';
1590Srgrimes				--p;
1590Srgrimes				break;
1590Srgrimes			case 'b':
1590Srgrimes				ch = '\b';
1590Srgrimes				break;
1590Srgrimes			case 'f':
1590Srgrimes				ch = '\f';
1590Srgrimes				break;
1590Srgrimes			case 'n':
1590Srgrimes				ch = '\n';
1590Srgrimes				break;
1590Srgrimes			case 'r':
1590Srgrimes				ch = '\r';
1590Srgrimes				break;
1590Srgrimes			case 't':
1590Srgrimes				ch = '\t';
1590Srgrimes				break;
104108Sjmallett			default:
104108Sjmallett				break;
1590Srgrimes			}
1590Srgrimes			break;
104108Sjmallett		default:
104108Sjmallett			break;
1590Srgrimes		}
1590Srgrimes		if (!start)
1590Srgrimes			start = t;
1590Srgrimes		*t++ = (char) ch;
1590Srgrimes	}
1590Srgrimesdone:	argv[argc] = (char *)NULL;
1590Srgrimes	*store_argc = argc;
1590Srgrimes	return(argv);
1590Srgrimes}
1590Srgrimes
/*
 * Str_FindSubstring -- See if a string contains a particular substring.
 *
 * Results: If string contains substring, the return value is the location of
 * the first matching instance of substring in string.  If string doesn't
 * contain substring, the return value is NULL.  Matching is done on an exact
 * character-for-character basis with no wildcards or special characters.
 *
 * An empty substring is never found (NULL is returned).  This differs from
 * strstr(3), which would return string, and is kept for existing callers.
 *
 * Side effects: None.
 */
char *
Str_FindSubstring(char *string, char *substring)
{
	/* preserve the historical "empty substring never matches" rule */
	if (*substring == '\0')
		return((char *) NULL);

	return(strstr(string, substring));
}
1590Srgrimes
/*
 * Str_Match --
 *
 * See if a particular string matches a particular pattern.
 *
 * Results: Non-zero is returned if string matches pattern, 0 otherwise. The
 * matching operation permits the following special characters in the
 * pattern: *?\[] (see the man page for details on what these mean).
 *
 *	*	matches any sequence of characters, including none; a run
 *		of several '*' behaves like a single one
 *	?	matches any single character
 *	[...]	matches one character out of a list and/or ranges written
 *		as two characters separated by '-' (either order); a set
 *		that is missing its closing ']' is treated as if it ended
 *		at the end of the pattern
 *	\x	matches the character x literally
 *
 * Side effects: None.
 */
int
Str_Match(char *string, char *pattern)
{
	char c2;

	for (;;) {
		/*
		 * See if we're at the end of both the pattern and the
		 * string. If so, we succeeded.  If we're at the end of the
		 * pattern but not at the end of the string, we failed.
		 */
		if (*pattern == 0)
			return(!*string);
		if (*string == 0 && *pattern != '*')
			return(0);
		/*
		 * Check for a "*" as the next pattern character.  It matches
		 * any substring.  We handle this by calling ourselves
		 * recursively for each postfix of string, until either we
		 * match or we reach the end of the string.
		 */
		if (*pattern == '*') {
			/*
			 * Collapse consecutive stars first; otherwise a
			 * second '*' would be handed an empty remainder
			 * and wrongly fail (e.g. "a" against "a**").
			 */
			while (*pattern == '*')
				++pattern;
			if (*pattern == 0)
				return(1);
			while (*string != 0) {
				if (Str_Match(string, pattern))
					return(1);
				++string;
			}
			return(0);
		}
		/*
		 * Check for a "?" as the next pattern character.  It matches
		 * any single character.
		 */
		if (*pattern == '?')
			goto thisCharOK;
		/*
		 * Check for a "[" as the next pattern character.  It is
		 * followed by a list of characters that are acceptable, or
		 * by a range (two characters separated by "-").
		 */
		if (*pattern == '[') {
			++pattern;
			for (;;) {
				/* ran out of candidates: no match */
				if ((*pattern == ']') || (*pattern == 0))
					return(0);
				if (*pattern == *string)
					break;
				if (pattern[1] == '-') {
					c2 = pattern[2];
					if (c2 == 0)
						return(0);
					/* the range may be given low-high ... */
					if ((*pattern <= *string) &&
					    (c2 >= *string))
						break;
					/* ... or high-low */
					if ((*pattern >= *string) &&
					    (c2 <= *string))
						break;
					pattern += 2;
				}
				++pattern;
			}
			/* matched: skip the remainder of the set */
			while ((*pattern != ']') && (*pattern != 0))
				++pattern;
			/*
			 * Unterminated set: stay on the NUL so that the
			 * increment at thisCharOK does not step past the
			 * end of the pattern.
			 */
			if (*pattern == 0)
				--pattern;
			goto thisCharOK;
		}
		/*
		 * If the next pattern character is '\', just strip off the
		 * '\' so we do exact matching on the character that follows.
		 */
		if (*pattern == '\\') {
			++pattern;
			if (*pattern == 0)
				return(0);
		}
		/*
		 * There's no special character.  Just make sure that the
		 * next characters of each string match.
		 */
		if (*pattern != *string)
			return(0);
thisCharOK:	++pattern;
		++string;
	}
}
1590Srgrimes
1590Srgrimes
/*-
 *-----------------------------------------------------------------------
 * Str_SYSVMatch --
 *	Check word against pattern for a match, where a '%' in the
 *	pattern stands for an arbitrary stem.  The text before the '%'
 *	must be a prefix of word and the text after it a suffix.  A
 *	pattern without '%' is compared as a suffix only.
 *
 * Results:
 *	Returns a pointer into word at the start of the stem, or NULL
 *	if there is no match.  The length of the stem is stored in *len.
 *	An empty word never matches (*len is set to 0); an empty pattern
 *	matches the whole word.  On the other no-match paths *len is
 *	left untouched.
 *
 * Side Effects:
 *	None
 *
 *-----------------------------------------------------------------------
 */
char *
Str_SYSVMatch(char *word, char *pattern, int *len)
{
    char *percent;	/* position of '%' in the pattern, if any */
    char *stem;		/* where the stem begins inside word */
    char *tail;		/* candidate start of the suffix inside word */

    if (word[0] == '\0') {
	/* nothing to match against */
	*len = 0;
	return NULL;
    }

    if (pattern[0] == '\0') {
	/* an empty pattern selects the entire word */
	*len = strlen(word);
	return word;
    }

    stem = word;
    percent = strchr(pattern, '%');
    if (percent != NULL) {
	/* walk the prefix in lock step with the word */
	while (pattern != percent && *stem != '\0' && *stem == *pattern) {
	    stem++;
	    pattern++;
	}

	/* stopped before reaching the '%': the prefix differs */
	if (pattern != percent)
	    return NULL;

	/* step over the '%'; with no suffix the rest of word is the stem */
	pattern++;
	if (*pattern == '\0') {
	    *len = strlen(stem);
	    return stem;
	}
    }

    /* look for the position at which the remaining pattern is the tail */
    for (tail = stem;; tail++) {
	if (strcmp(pattern, tail) == 0) {
	    *len = tail - stem;
	    return stem;
	}
	if (*tail == '\0')
	    break;
    }

    return NULL;
}
1590Srgrimes
1590Srgrimes
1590Srgrimes/*-
1590Srgrimes *-----------------------------------------------------------------------
1590Srgrimes * Str_SYSVSubst --
1590Srgrimes *	Substitute '%' on the pattern with len characters from src.
1590Srgrimes *	If the pattern does not contain a '%' prepend len characters
1590Srgrimes *	from src.
8874Srgrimes *
1590Srgrimes * Results:
1590Srgrimes *	None
1590Srgrimes *
1590Srgrimes * Side Effects:
1590Srgrimes *	Places result on buf
1590Srgrimes *
1590Srgrimes *-----------------------------------------------------------------------
1590Srgrimes */
1590Srgrimesvoid
104696SjmallettStr_SYSVSubst(Buffer buf, char *pat, char *src, int len)
1590Srgrimes{
1590Srgrimes    char *m;
1590Srgrimes
1590Srgrimes    if ((m = strchr(pat, '%')) != NULL) {
1590Srgrimes	/* Copy the prefix */
1590Srgrimes	Buf_AddBytes(buf, m - pat, (Byte *) pat);
1590Srgrimes	/* skip the % */
1590Srgrimes	pat = m + 1;
1590Srgrimes    }
1590Srgrimes
1590Srgrimes    /* Copy the pattern */
1590Srgrimes    Buf_AddBytes(buf, len, (Byte *) src);
1590Srgrimes
1590Srgrimes    /* append the rest */
1590Srgrimes    Buf_AddBytes(buf, strlen(pat), (Byte *) pat);
1590Srgrimes}