I _think_ this implements ${foo/bar/baz} logic (bar is a glob pattern)

todo tomorrow:
• test case (compare with e.g. GNU bash)
• manpage
• version bump

sqchar is a bit ugly, but \/ must be preserved, as we don’t get wdencoded
strings later on in the process (eval.c CSUBST) and I didn’t want to have
an implementation like ${foo: 2: 3} this time
This commit is contained in:
tg 2008-02-27 01:00:10 +00:00
parent 0f1501326b
commit 01b54f1fd5
4 changed files with 97 additions and 14 deletions

88
eval.c
View File

@ -2,7 +2,7 @@
#include "sh.h" #include "sh.h"
__RCSID("$MirOS: src/bin/mksh/eval.c,v 1.36 2007/10/25 15:34:29 tg Exp $"); __RCSID("$MirOS: src/bin/mksh/eval.c,v 1.37 2008/02/27 01:00:09 tg Exp $");
#ifdef MKSH_SMALL #ifdef MKSH_SMALL
#define MKSH_NOPWNAM #define MKSH_NOPWNAM
@ -166,6 +166,7 @@ expand(const char *cp, /* input word */
int newlines = 0; /* For trailing newlines in COMSUB */ int newlines = 0; /* For trailing newlines in COMSUB */
int saw_eq, tilde_ok; int saw_eq, tilde_ok;
int make_magic; int make_magic;
int sqchar = 0; /* char to keep bksl before (${…/…\/…/…}) */
size_t len; size_t len;
if (cp == NULL) if (cp == NULL)
@ -373,6 +374,13 @@ expand(const char *cp, /* input word */
*dp++ = MAGIC; *dp++ = MAGIC;
*dp++ = (char)('@' | 0x80); *dp++ = (char)('@' | 0x80);
break; break;
case '/':
/* ! DOBLANK,DOBRACE_,DOTILDE */
f = DOPAT | (f&DONTRUNCOMMAND) |
DOTEMP_;
quote = 0;
sqchar = '/';
break;
case '=': case '=':
/* Enabling tilde expansion /* Enabling tilde expansion
* after :s here is * after :s here is
@ -416,6 +424,7 @@ expand(const char *cp, /* input word */
tilde_ok = 0; /* in case of ${unset:-} */ tilde_ok = 0; /* in case of ${unset:-} */
*dp = '\0'; *dp = '\0';
quote = st->quote; quote = st->quote;
sqchar = 0;
f = st->f; f = st->f;
if (f&DOBLANK) if (f&DOBLANK)
doblank--; doblank--;
@ -423,7 +432,10 @@ expand(const char *cp, /* input word */
case '#': case '#':
case '%': case '%':
/* Append end-pattern */ /* Append end-pattern */
*dp++ = MAGIC; *dp++ = ')'; *dp = '\0'; *dp++ = MAGIC; *dp++ = ')';
/* FALLTHROUGH */
case '/':
*dp = '\0';
dp = Xrestpos(ds, dp, st->base); dp = Xrestpos(ds, dp, st->base);
/* Must use st->var since calling /* Must use st->var since calling
* global would break things * global would break things
@ -588,6 +600,9 @@ expand(const char *cp, /* input word */
break; break;
} }
if (quote && sqchar == c)
*dp++ = '\\';
/* check for end of word or IFS separation */ /* check for end of word or IFS separation */
if (c == 0 || (!quote && (f & DOBLANK) && doblank && if (c == 0 || (!quote && (f & DOBLANK) && doblank &&
!make_magic && ctype(c, C_IFS))) { !make_magic && ctype(c, C_IFS))) {
@ -823,6 +838,7 @@ varsub(Expand *xp, const char *sp, const char *word,
switch (stype & 0x7f) { switch (stype & 0x7f) {
case '=': /* can't assign to a vector */ case '=': /* can't assign to a vector */
case '%': /* can't trim a vector (yet) */ case '%': /* can't trim a vector (yet) */
case '/':
case '#': case '#':
return -1; return -1;
} }
@ -845,6 +861,7 @@ varsub(Expand *xp, const char *sp, const char *word,
case '=': /* can't assign to a vector */ case '=': /* can't assign to a vector */
case '%': /* can't trim a vector (yet) */ case '%': /* can't trim a vector (yet) */
case '#': case '#':
case '/':
case '?': case '?':
return -1; return -1;
} }
@ -951,7 +968,7 @@ trimsub(char *str, char *pat, int how)
char *end = strnul(str); char *end = strnul(str);
char *p, c; char *p, c;
switch (how&0xff) { /* UCHAR_MAX maybe? */ switch (how & 0xFF) {
case '#': /* shortest at beginning */ case '#': /* shortest at beginning */
for (p = str; p <= end; p++) { for (p = str; p <= end; p++) {
c = *p; *p = '\0'; c = *p; *p = '\0';
@ -984,6 +1001,71 @@ trimsub(char *str, char *pat, int how)
return str_nsave(str, p - str, ATEMP); return str_nsave(str, p - str, ATEMP);
} }
break; break;
case '/': /* replace once - SLOW! */
case '/'|0x80: /* replace all - SLOWER! */
{
char *rpat, *rrep, *tpat1, *tpat2, *sbeg, *s, *d;
bool gotmatch = false;
sbeg = s = str;
/* separate search pattern and replacement string */
p = d = rpat = str_save(pat, ATEMP);
while (*p)
if (*p == '\\') {
p++;
if (*p)
p++;
} else if (*p == '/') {
*p++ = '\0';
d = p;
gotmatch = true;
break;
} else
p++;
rrep = gotmatch ? d : null;
/* first see if we have any match at all */
tpat1 = shf_smprintf("%c%c%c*%s%c*%c)", MAGIC, '@' | 0x80,
MAGIC, rpat, MAGIC, MAGIC);
tpat2 = shf_smprintf("%c%c%s%c*%c)", MAGIC, '@' | 0x80,
rpat, MAGIC, MAGIC);
again_repl:
/* this would not be necessary if gmatchx would return
* the start and end values of a match found, like re*
*/
if (!gmatchx(s, tpat1, false))
goto end_repl;
/* now anchor the beginning of the match */
while (sbeg <= end)
if (gmatchx(sbeg, tpat2, false))
break;
else
sbeg++;
/* now anchor the end of the match */
for (p = end; p >= sbeg; p--) {
c = *p; *p = '\0';
gotmatch = gmatchx(sbeg, rpat, false);
*p = c;
if (gotmatch)
break;
}
end = str_nsave(s, sbeg - s, ATEMP);
d = shf_smprintf("%s%s%s", end, rrep, p);
afree(end, ATEMP);
sbeg = d + (sbeg - s) + strlen(rrep);
if (s != str)
afree(s, ATEMP);
s = d;
end = strnul(s);
if ((how & 0xFF) != '/')
goto again_repl;
end_repl:
afree(rpat, ATEMP);
afree(tpat1, ATEMP);
afree(tpat2, ATEMP);
return (s);
break;
}
} }
return str; /* no match, return string */ return str; /* no match, return string */

4
lex.c
View File

@ -2,7 +2,7 @@
#include "sh.h" #include "sh.h"
__RCSID("$MirOS: src/bin/mksh/lex.c,v 1.52 2008/02/26 21:08:33 tg Exp $"); __RCSID("$MirOS: src/bin/mksh/lex.c,v 1.53 2008/02/27 01:00:09 tg Exp $");
/* /*
* states while lexing word * states while lexing word
@ -395,7 +395,7 @@ yylex(int cf)
/* If this is a trim operation, /* If this is a trim operation,
* treat (,|,) specially in STBRACE. * treat (,|,) specially in STBRACE.
*/ */
if (c == '#' || c == '%') { if (ctype(c, C_SUBOP2)) {
ungetsc(c); ungetsc(c);
PUSH_STATE(STBRACE); PUSH_STATE(STBRACE);
} else { } else {

4
misc.c
View File

@ -6,7 +6,7 @@
#include <grp.h> #include <grp.h>
#endif #endif
__RCSID("$MirOS: src/bin/mksh/misc.c,v 1.67 2007/10/25 15:19:16 tg Exp $\t" __RCSID("$MirOS: src/bin/mksh/misc.c,v 1.68 2008/02/27 01:00:09 tg Exp $\t"
MKSH_SH_H_ID); MKSH_SH_H_ID);
#undef USE_CHVT #undef USE_CHVT
@ -499,7 +499,7 @@ bi_getn(const char *as, int *ai)
*/ */
int int
gmatchx(const char *s, const char *p, int isfile) gmatchx(const char *s, const char *p, bool isfile)
{ {
const char *se, *pe; const char *se, *pe;

7
sh.h
View File

@ -8,7 +8,7 @@
/* $OpenBSD: c_test.h,v 1.4 2004/12/20 11:34:26 otto Exp $ */ /* $OpenBSD: c_test.h,v 1.4 2004/12/20 11:34:26 otto Exp $ */
/* $OpenBSD: tty.h,v 1.5 2004/12/20 11:34:26 otto Exp $ */ /* $OpenBSD: tty.h,v 1.5 2004/12/20 11:34:26 otto Exp $ */
#define MKSH_SH_H_ID "$MirOS: src/bin/mksh/sh.h,v 1.187 2008/02/26 20:43:11 tg Exp $" #define MKSH_SH_H_ID "$MirOS: src/bin/mksh/sh.h,v 1.188 2008/02/27 01:00:10 tg Exp $"
#define MKSH_VERSION "R33 2008/02/26" #define MKSH_VERSION "R33 2008/02/26"
#if HAVE_SYS_PARAM_H #if HAVE_SYS_PARAM_H
@ -543,7 +543,8 @@ EXTERN int really_exit;
extern unsigned char chtypes[]; extern unsigned char chtypes[];
#define ctype(c, t) !!( ((t) == C_SUBOP2) ? \ #define ctype(c, t) !!( ((t) == C_SUBOP2) ? \
(((c) == '#' || (c) == '%') ? 1 : 0) : \ (((c) == '#' || (c) == '%' || \
(c) == '/') ? 1 : 0) : \
(chtypes[(unsigned char)(c)]&(t)) ) (chtypes[(unsigned char)(c)]&(t)) )
#define ksh_isalphx(c) ctype((c), C_ALPHA) #define ksh_isalphx(c) ctype((c), C_ALPHA)
#define ksh_isalnux(c) ctype((c), C_ALPHA | C_DIGIT) #define ksh_isalnux(c) ctype((c), C_ALPHA | C_DIGIT)
@ -1394,7 +1395,7 @@ void change_flag(enum sh_flag, int, char);
int parse_args(const char **, int, int *); int parse_args(const char **, int, int *);
int getn(const char *, int *); int getn(const char *, int *);
int bi_getn(const char *, int *); int bi_getn(const char *, int *);
int gmatchx(const char *, const char *, int); int gmatchx(const char *, const char *, bool);
int has_globbing(const char *, const char *); int has_globbing(const char *, const char *);
const unsigned char *pat_scan(const unsigned char *, const unsigned char *, int); const unsigned char *pat_scan(const unsigned char *, const unsigned char *, int);
int xstrcmp(const void *, const void *); int xstrcmp(const void *, const void *);