I _think_ this implements ${foo/bar/baz} logic (bar is a glob pattern)
todo tomorrow:
• test case (compare with e.g. GNU bash)
• manpage
• version bump
sqchar is a bit ugly, but \/ must be preserved, as we don’t get wdencoded
strings later on in the process (eval.c CSUBST) and I didn’t want to have
an implementation like ${foo: 2: 3} this time
			
			
This commit is contained in:
		
							
								
								
									
										92
									
								
								eval.c
									
									
									
									
									
								
							
							
						
						
									
										92
									
								
								eval.c
									
									
									
									
									
								
							| @@ -2,7 +2,7 @@ | |||||||
|  |  | ||||||
| #include "sh.h" | #include "sh.h" | ||||||
|  |  | ||||||
| __RCSID("$MirOS: src/bin/mksh/eval.c,v 1.36 2007/10/25 15:34:29 tg Exp $"); | __RCSID("$MirOS: src/bin/mksh/eval.c,v 1.37 2008/02/27 01:00:09 tg Exp $"); | ||||||
|  |  | ||||||
| #ifdef MKSH_SMALL | #ifdef MKSH_SMALL | ||||||
| #define MKSH_NOPWNAM | #define MKSH_NOPWNAM | ||||||
| @@ -166,6 +166,7 @@ expand(const char *cp,	/* input word */ | |||||||
| 	int newlines = 0; /* For trailing newlines in COMSUB */ | 	int newlines = 0; /* For trailing newlines in COMSUB */ | ||||||
| 	int saw_eq, tilde_ok; | 	int saw_eq, tilde_ok; | ||||||
| 	int make_magic; | 	int make_magic; | ||||||
|  | 	int sqchar = 0;		/* char to keep bksl before (${…/…\/…/…}) */ | ||||||
| 	size_t len; | 	size_t len; | ||||||
|  |  | ||||||
| 	if (cp == NULL) | 	if (cp == NULL) | ||||||
| @@ -373,6 +374,13 @@ expand(const char *cp,	/* input word */ | |||||||
| 						*dp++ = MAGIC; | 						*dp++ = MAGIC; | ||||||
| 						*dp++ = (char)('@' | 0x80); | 						*dp++ = (char)('@' | 0x80); | ||||||
| 						break; | 						break; | ||||||
|  | 					case '/': | ||||||
|  | 						/* ! DOBLANK,DOBRACE_,DOTILDE */ | ||||||
|  | 						f = DOPAT | (f&DONTRUNCOMMAND) | | ||||||
|  | 						    DOTEMP_; | ||||||
|  | 						quote = 0; | ||||||
|  | 						sqchar = '/'; | ||||||
|  | 						break; | ||||||
| 					case '=': | 					case '=': | ||||||
| 						/* Enabling tilde expansion | 						/* Enabling tilde expansion | ||||||
| 						 * after :s here is | 						 * after :s here is | ||||||
| @@ -416,6 +424,7 @@ expand(const char *cp,	/* input word */ | |||||||
| 				tilde_ok = 0;	/* in case of ${unset:-} */ | 				tilde_ok = 0;	/* in case of ${unset:-} */ | ||||||
| 				*dp = '\0'; | 				*dp = '\0'; | ||||||
| 				quote = st->quote; | 				quote = st->quote; | ||||||
|  | 				sqchar = 0; | ||||||
| 				f = st->f; | 				f = st->f; | ||||||
| 				if (f&DOBLANK) | 				if (f&DOBLANK) | ||||||
| 					doblank--; | 					doblank--; | ||||||
| @@ -423,7 +432,10 @@ expand(const char *cp,	/* input word */ | |||||||
| 				case '#': | 				case '#': | ||||||
| 				case '%': | 				case '%': | ||||||
| 					/* Append end-pattern */ | 					/* Append end-pattern */ | ||||||
| 					*dp++ = MAGIC; *dp++ = ')'; *dp = '\0'; | 					*dp++ = MAGIC; *dp++ = ')'; | ||||||
|  | 					/* FALLTHROUGH */ | ||||||
|  | 				case '/': | ||||||
|  | 					*dp = '\0'; | ||||||
| 					dp = Xrestpos(ds, dp, st->base); | 					dp = Xrestpos(ds, dp, st->base); | ||||||
| 					/* Must use st->var since calling | 					/* Must use st->var since calling | ||||||
| 					 * global would break things | 					 * global would break things | ||||||
| @@ -588,6 +600,9 @@ expand(const char *cp,	/* input word */ | |||||||
| 			break; | 			break; | ||||||
| 		} | 		} | ||||||
|  |  | ||||||
|  | 		if (quote && sqchar == c) | ||||||
|  | 			*dp++ = '\\'; | ||||||
|  |  | ||||||
| 		/* check for end of word or IFS separation */ | 		/* check for end of word or IFS separation */ | ||||||
| 		if (c == 0 || (!quote && (f & DOBLANK) && doblank && | 		if (c == 0 || (!quote && (f & DOBLANK) && doblank && | ||||||
| 		    !make_magic && ctype(c, C_IFS))) { | 		    !make_magic && ctype(c, C_IFS))) { | ||||||
| @@ -823,6 +838,7 @@ varsub(Expand *xp, const char *sp, const char *word, | |||||||
| 		switch (stype & 0x7f) { | 		switch (stype & 0x7f) { | ||||||
| 		case '=':	/* can't assign to a vector */ | 		case '=':	/* can't assign to a vector */ | ||||||
| 		case '%':	/* can't trim a vector (yet) */ | 		case '%':	/* can't trim a vector (yet) */ | ||||||
|  | 		case '/': | ||||||
| 		case '#': | 		case '#': | ||||||
| 			return -1; | 			return -1; | ||||||
| 		} | 		} | ||||||
| @@ -845,6 +861,7 @@ varsub(Expand *xp, const char *sp, const char *word, | |||||||
| 			case '=':	/* can't assign to a vector */ | 			case '=':	/* can't assign to a vector */ | ||||||
| 			case '%':	/* can't trim a vector (yet) */ | 			case '%':	/* can't trim a vector (yet) */ | ||||||
| 			case '#': | 			case '#': | ||||||
|  | 			case '/': | ||||||
| 			case '?': | 			case '?': | ||||||
| 				return -1; | 				return -1; | ||||||
| 			} | 			} | ||||||
| @@ -951,7 +968,7 @@ trimsub(char *str, char *pat, int how) | |||||||
| 	char *end = strnul(str); | 	char *end = strnul(str); | ||||||
| 	char *p, c; | 	char *p, c; | ||||||
|  |  | ||||||
| 	switch (how&0xff) {	/* UCHAR_MAX maybe? */ | 	switch (how & 0xFF) { | ||||||
| 	case '#':		/* shortest at beginning */ | 	case '#':		/* shortest at beginning */ | ||||||
| 		for (p = str; p <= end; p++) { | 		for (p = str; p <= end; p++) { | ||||||
| 			c = *p; *p = '\0'; | 			c = *p; *p = '\0'; | ||||||
| @@ -962,7 +979,7 @@ trimsub(char *str, char *pat, int how) | |||||||
| 			*p = c; | 			*p = c; | ||||||
| 		} | 		} | ||||||
| 		break; | 		break; | ||||||
| 	case '#'|0x80:	/* longest match at beginning */ | 	case '#'|0x80:		/* longest match at beginning */ | ||||||
| 		for (p = end; p >= str; p--) { | 		for (p = end; p >= str; p--) { | ||||||
| 			c = *p; *p = '\0'; | 			c = *p; *p = '\0'; | ||||||
| 			if (gmatchx(str, pat, false)) { | 			if (gmatchx(str, pat, false)) { | ||||||
| @@ -978,12 +995,77 @@ trimsub(char *str, char *pat, int how) | |||||||
| 				return str_nsave(str, p - str, ATEMP); | 				return str_nsave(str, p - str, ATEMP); | ||||||
| 		} | 		} | ||||||
| 		break; | 		break; | ||||||
| 	case '%'|0x80:	/* longest match at end */ | 	case '%'|0x80:		/* longest match at end */ | ||||||
| 		for (p = str; p <= end; p++) { | 		for (p = str; p <= end; p++) { | ||||||
| 			if (gmatchx(p, pat, false)) | 			if (gmatchx(p, pat, false)) | ||||||
| 				return str_nsave(str, p - str, ATEMP); | 				return str_nsave(str, p - str, ATEMP); | ||||||
| 		} | 		} | ||||||
| 		break; | 		break; | ||||||
|  | 	case '/':		/* replace once - SLOW! */ | ||||||
|  | 	case '/'|0x80:		/* replace all - SLOWER! */ | ||||||
|  | 	    { | ||||||
|  | 		char *rpat, *rrep, *tpat1, *tpat2, *sbeg, *s, *d; | ||||||
|  | 		bool gotmatch = false; | ||||||
|  |  | ||||||
|  | 		sbeg = s = str; | ||||||
|  | 		/* separate search pattern and replacement string */ | ||||||
|  | 		p = d = rpat = str_save(pat, ATEMP); | ||||||
|  |  		while (*p) | ||||||
|  | 			if (*p == '\\') { | ||||||
|  | 				p++; | ||||||
|  | 				if (*p) | ||||||
|  | 					p++; | ||||||
|  | 			} else if (*p == '/') { | ||||||
|  | 				*p++ = '\0'; | ||||||
|  | 				d = p; | ||||||
|  | 				gotmatch = true; | ||||||
|  | 				break; | ||||||
|  | 			} else | ||||||
|  | 				p++; | ||||||
|  | 		rrep = gotmatch ? d : null; | ||||||
|  |  | ||||||
|  | 		/* first see if we have any match at all */ | ||||||
|  | 		tpat1 = shf_smprintf("%c%c%c*%s%c*%c)", MAGIC, '@' | 0x80, | ||||||
|  | 		    MAGIC, rpat, MAGIC, MAGIC); | ||||||
|  | 		tpat2 = shf_smprintf("%c%c%s%c*%c)", MAGIC, '@' | 0x80, | ||||||
|  | 		    rpat, MAGIC, MAGIC); | ||||||
|  |  again_repl: | ||||||
|  | 		/* this would not be necessary if gmatchx would return | ||||||
|  | 		 * the start and end values of a match found, like re* | ||||||
|  | 		 */ | ||||||
|  | 		if (!gmatchx(s, tpat1, false)) | ||||||
|  | 			goto end_repl; | ||||||
|  | 		/* now anchor the beginning of the match */ | ||||||
|  | 		while (sbeg <= end) | ||||||
|  | 			if (gmatchx(sbeg, tpat2, false)) | ||||||
|  | 				break; | ||||||
|  | 			else | ||||||
|  | 				sbeg++; | ||||||
|  | 		/* now anchor the end of the match */ | ||||||
|  | 		for (p = end; p >= sbeg; p--) { | ||||||
|  | 			c = *p; *p = '\0'; | ||||||
|  | 			gotmatch = gmatchx(sbeg, rpat, false); | ||||||
|  | 			*p = c; | ||||||
|  | 			if (gotmatch) | ||||||
|  | 				break; | ||||||
|  | 		} | ||||||
|  | 		end = str_nsave(s, sbeg - s, ATEMP); | ||||||
|  | 		d = shf_smprintf("%s%s%s", end, rrep, p); | ||||||
|  | 		afree(end, ATEMP); | ||||||
|  | 		sbeg = d + (sbeg - s) + strlen(rrep); | ||||||
|  | 		if (s != str) | ||||||
|  | 			afree(s, ATEMP); | ||||||
|  | 		s = d; | ||||||
|  | 		end = strnul(s); | ||||||
|  | 		if ((how & 0xFF) != '/') | ||||||
|  | 			goto again_repl; | ||||||
|  |  end_repl: | ||||||
|  | 		afree(rpat, ATEMP); | ||||||
|  | 		afree(tpat1, ATEMP); | ||||||
|  | 		afree(tpat2, ATEMP); | ||||||
|  | 		return (s); | ||||||
|  | 		break; | ||||||
|  | 	    } | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| 	return str;		/* no match, return string */ | 	return str;		/* no match, return string */ | ||||||
|   | |||||||
							
								
								
									
										4
									
								
								lex.c
									
									
									
									
									
								
							
							
						
						
									
										4
									
								
								lex.c
									
									
									
									
									
								
							| @@ -2,7 +2,7 @@ | |||||||
|  |  | ||||||
| #include "sh.h" | #include "sh.h" | ||||||
|  |  | ||||||
| __RCSID("$MirOS: src/bin/mksh/lex.c,v 1.52 2008/02/26 21:08:33 tg Exp $"); | __RCSID("$MirOS: src/bin/mksh/lex.c,v 1.53 2008/02/27 01:00:09 tg Exp $"); | ||||||
|  |  | ||||||
| /* | /* | ||||||
|  * states while lexing word |  * states while lexing word | ||||||
| @@ -395,7 +395,7 @@ yylex(int cf) | |||||||
| 					/* If this is a trim operation, | 					/* If this is a trim operation, | ||||||
| 					 * treat (,|,) specially in STBRACE. | 					 * treat (,|,) specially in STBRACE. | ||||||
| 					 */ | 					 */ | ||||||
| 					if (c == '#' || c == '%') { | 					if (ctype(c, C_SUBOP2)) { | ||||||
| 						ungetsc(c); | 						ungetsc(c); | ||||||
| 						PUSH_STATE(STBRACE); | 						PUSH_STATE(STBRACE); | ||||||
| 					} else { | 					} else { | ||||||
|   | |||||||
							
								
								
									
										8
									
								
								misc.c
									
									
									
									
									
								
							
							
						
						
									
										8
									
								
								misc.c
									
									
									
									
									
								
							| @@ -6,7 +6,7 @@ | |||||||
| #include <grp.h> | #include <grp.h> | ||||||
| #endif | #endif | ||||||
|  |  | ||||||
| __RCSID("$MirOS: src/bin/mksh/misc.c,v 1.67 2007/10/25 15:19:16 tg Exp $\t" | __RCSID("$MirOS: src/bin/mksh/misc.c,v 1.68 2008/02/27 01:00:09 tg Exp $\t" | ||||||
| 	MKSH_SH_H_ID); | 	MKSH_SH_H_ID); | ||||||
|  |  | ||||||
| #undef USE_CHVT | #undef USE_CHVT | ||||||
| @@ -38,12 +38,12 @@ setctypes(const char *s, int t) | |||||||
| 	unsigned i; | 	unsigned i; | ||||||
|  |  | ||||||
| 	if (t & C_IFS) { | 	if (t & C_IFS) { | ||||||
| 		for (i = 0; i < UCHAR_MAX+1; i++) | 		for (i = 0; i < UCHAR_MAX + 1; i++) | ||||||
| 			chtypes[i] &= ~C_IFS; | 			chtypes[i] &= ~C_IFS; | ||||||
| 		chtypes[0] |= C_IFS; /* include \0 in C_IFS */ | 		chtypes[0] |= C_IFS; /* include \0 in C_IFS */ | ||||||
| 	} | 	} | ||||||
| 	while (*s != 0) | 	while (*s != 0) | ||||||
| 		chtypes[(unsigned char) *s++] |= t; | 		chtypes[(unsigned char)*s++] |= t; | ||||||
| } | } | ||||||
|  |  | ||||||
| void | void | ||||||
| @@ -499,7 +499,7 @@ bi_getn(const char *as, int *ai) | |||||||
|  */ |  */ | ||||||
|  |  | ||||||
| int | int | ||||||
| gmatchx(const char *s, const char *p, int isfile) | gmatchx(const char *s, const char *p, bool isfile) | ||||||
| { | { | ||||||
| 	const char *se, *pe; | 	const char *se, *pe; | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										7
									
								
								sh.h
									
									
									
									
									
								
							
							
						
						
									
										7
									
								
								sh.h
									
									
									
									
									
								
							| @@ -8,7 +8,7 @@ | |||||||
| /*	$OpenBSD: c_test.h,v 1.4 2004/12/20 11:34:26 otto Exp $	*/ | /*	$OpenBSD: c_test.h,v 1.4 2004/12/20 11:34:26 otto Exp $	*/ | ||||||
| /*	$OpenBSD: tty.h,v 1.5 2004/12/20 11:34:26 otto Exp $	*/ | /*	$OpenBSD: tty.h,v 1.5 2004/12/20 11:34:26 otto Exp $	*/ | ||||||
|  |  | ||||||
| #define MKSH_SH_H_ID "$MirOS: src/bin/mksh/sh.h,v 1.187 2008/02/26 20:43:11 tg Exp $" | #define MKSH_SH_H_ID "$MirOS: src/bin/mksh/sh.h,v 1.188 2008/02/27 01:00:10 tg Exp $" | ||||||
| #define MKSH_VERSION "R33 2008/02/26" | #define MKSH_VERSION "R33 2008/02/26" | ||||||
|  |  | ||||||
| #if HAVE_SYS_PARAM_H | #if HAVE_SYS_PARAM_H | ||||||
| @@ -543,7 +543,8 @@ EXTERN int really_exit; | |||||||
| extern unsigned char chtypes[]; | extern unsigned char chtypes[]; | ||||||
|  |  | ||||||
| #define ctype(c, t)	!!( ((t) == C_SUBOP2) ?				\ | #define ctype(c, t)	!!( ((t) == C_SUBOP2) ?				\ | ||||||
| 			    (((c) == '#' || (c) == '%') ? 1 : 0) :	\ | 			    (((c) == '#' || (c) == '%' || 		\ | ||||||
|  | 			      (c) == '/') ? 1 : 0) :			\ | ||||||
| 			    (chtypes[(unsigned char)(c)]&(t)) ) | 			    (chtypes[(unsigned char)(c)]&(t)) ) | ||||||
| #define ksh_isalphx(c)	ctype((c), C_ALPHA) | #define ksh_isalphx(c)	ctype((c), C_ALPHA) | ||||||
| #define ksh_isalnux(c)	ctype((c), C_ALPHA | C_DIGIT) | #define ksh_isalnux(c)	ctype((c), C_ALPHA | C_DIGIT) | ||||||
| @@ -1394,7 +1395,7 @@ void change_flag(enum sh_flag, int, char); | |||||||
| int parse_args(const char **, int, int *); | int parse_args(const char **, int, int *); | ||||||
| int getn(const char *, int *); | int getn(const char *, int *); | ||||||
| int bi_getn(const char *, int *); | int bi_getn(const char *, int *); | ||||||
| int gmatchx(const char *, const char *, int); | int gmatchx(const char *, const char *, bool); | ||||||
| int has_globbing(const char *, const char *); | int has_globbing(const char *, const char *); | ||||||
| const unsigned char *pat_scan(const unsigned char *, const unsigned char *, int); | const unsigned char *pat_scan(const unsigned char *, const unsigned char *, int); | ||||||
| int xstrcmp(const void *, const void *); | int xstrcmp(const void *, const void *); | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user