awk: fix -F 'regex' bug (miscounted fields if last field is empty)

This commit is contained in:
Denis Vlasenko 2007-07-18 18:32:25 +00:00
parent b78c782c85
commit af1bd09625

View File

@ -1522,9 +1522,12 @@ static int awk_split(const char *s, node *spl, char **slist)
if (*getvar_s(intvar[RS]) == '\0') if (*getvar_s(intvar[RS]) == '\0')
c[2] = '\n'; c[2] = '\n';
if ((spl->info & OPCLSMASK) == OC_REGEXP) { /* regex split */ if ((spl->info & OPCLSMASK) == OC_REGEXP) { /* regex split */
while (*s) { if (!*s)
l = strcspn(s, c+2); return n; /* "": zero fields */
n++; /* at least one field will be there */
do {
l = strcspn(s, c+2); /* len till next NUL or \n */
if (regexec(icase ? spl->r.ire : spl->l.re, s, 1, pmatch, 0) == 0 if (regexec(icase ? spl->r.ire : spl->l.re, s, 1, pmatch, 0) == 0
&& pmatch[0].rm_so <= l && pmatch[0].rm_so <= l
) { ) {
@ -1533,24 +1536,27 @@ static int awk_split(const char *s, node *spl, char **slist)
l++; l++;
pmatch[0].rm_eo++; pmatch[0].rm_eo++;
} }
n++; /* we saw yet another delimiter */
} else { } else {
pmatch[0].rm_eo = l; pmatch[0].rm_eo = l;
if (s[l]) pmatch[0].rm_eo++; if (s[l]) pmatch[0].rm_eo++;
} }
memcpy(s1, s, l); memcpy(s1, s, l);
s1[l] = '\0'; s1[l] = '\0';
nextword(&s1); nextword(&s1);
s += pmatch[0].rm_eo; s += pmatch[0].rm_eo;
n++; } while (*s);
} return n;
} else if (c[0] == '\0') { /* null split */ }
if (c[0] == '\0') { /* null split */
while (*s) { while (*s) {
*s1++ = *s++; *s1++ = *s++;
*s1++ = '\0'; *s1++ = '\0';
n++; n++;
} }
} else if (c[0] != ' ') { /* single-character split */ return n;
}
if (c[0] != ' ') { /* single-character split */
if (icase) { if (icase) {
c[0] = toupper(c[0]); c[0] = toupper(c[0]);
c[1] = tolower(c[1]); c[1] = tolower(c[1]);
@ -1560,21 +1566,23 @@ static int awk_split(const char *s, node *spl, char **slist)
*s1++ = '\0'; *s1++ = '\0';
n++; n++;
} }
} else { /* space split */ return n;
while (*s) { }
s = skip_whitespace(s); /* space split */
if (!*s) break; while (*s) {
n++; s = skip_whitespace(s);
while (*s && !isspace(*s)) if (!*s) break;
*s1++ = *s++; n++;
*s1++ = '\0'; while (*s && !isspace(*s))
} *s1++ = *s++;
*s1++ = '\0';
} }
return n; return n;
} }
static void split_f0(void) static void split_f0(void)
{ {
/* static char *fstrings; */
#define fstrings (G.split_f0__fstrings) #define fstrings (G.split_f0__fstrings)
int i, n; int i, n;