awk: fix -F 'regex' bug (miscounted fields if last field is empty)
This commit is contained in:
parent
b78c782c85
commit
af1bd09625
@ -1522,9 +1522,12 @@ static int awk_split(const char *s, node *spl, char **slist)
|
|||||||
if (*getvar_s(intvar[RS]) == '\0')
|
if (*getvar_s(intvar[RS]) == '\0')
|
||||||
c[2] = '\n';
|
c[2] = '\n';
|
||||||
|
|
||||||
if ((spl->info & OPCLSMASK) == OC_REGEXP) { /* regex split */
|
if ((spl->info & OPCLSMASK) == OC_REGEXP) { /* regex split */
|
||||||
while (*s) {
|
if (!*s)
|
||||||
l = strcspn(s, c+2);
|
return n; /* "": zero fields */
|
||||||
|
n++; /* at least one field will be there */
|
||||||
|
do {
|
||||||
|
l = strcspn(s, c+2); /* len till next NUL or \n */
|
||||||
if (regexec(icase ? spl->r.ire : spl->l.re, s, 1, pmatch, 0) == 0
|
if (regexec(icase ? spl->r.ire : spl->l.re, s, 1, pmatch, 0) == 0
|
||||||
&& pmatch[0].rm_so <= l
|
&& pmatch[0].rm_so <= l
|
||||||
) {
|
) {
|
||||||
@ -1533,24 +1536,27 @@ static int awk_split(const char *s, node *spl, char **slist)
|
|||||||
l++;
|
l++;
|
||||||
pmatch[0].rm_eo++;
|
pmatch[0].rm_eo++;
|
||||||
}
|
}
|
||||||
|
n++; /* we saw yet another delimiter */
|
||||||
} else {
|
} else {
|
||||||
pmatch[0].rm_eo = l;
|
pmatch[0].rm_eo = l;
|
||||||
if (s[l]) pmatch[0].rm_eo++;
|
if (s[l]) pmatch[0].rm_eo++;
|
||||||
}
|
}
|
||||||
|
|
||||||
memcpy(s1, s, l);
|
memcpy(s1, s, l);
|
||||||
s1[l] = '\0';
|
s1[l] = '\0';
|
||||||
nextword(&s1);
|
nextword(&s1);
|
||||||
s += pmatch[0].rm_eo;
|
s += pmatch[0].rm_eo;
|
||||||
n++;
|
} while (*s);
|
||||||
}
|
return n;
|
||||||
} else if (c[0] == '\0') { /* null split */
|
}
|
||||||
|
if (c[0] == '\0') { /* null split */
|
||||||
while (*s) {
|
while (*s) {
|
||||||
*s1++ = *s++;
|
*s1++ = *s++;
|
||||||
*s1++ = '\0';
|
*s1++ = '\0';
|
||||||
n++;
|
n++;
|
||||||
}
|
}
|
||||||
} else if (c[0] != ' ') { /* single-character split */
|
return n;
|
||||||
|
}
|
||||||
|
if (c[0] != ' ') { /* single-character split */
|
||||||
if (icase) {
|
if (icase) {
|
||||||
c[0] = toupper(c[0]);
|
c[0] = toupper(c[0]);
|
||||||
c[1] = tolower(c[1]);
|
c[1] = tolower(c[1]);
|
||||||
@ -1560,21 +1566,23 @@ static int awk_split(const char *s, node *spl, char **slist)
|
|||||||
*s1++ = '\0';
|
*s1++ = '\0';
|
||||||
n++;
|
n++;
|
||||||
}
|
}
|
||||||
} else { /* space split */
|
return n;
|
||||||
while (*s) {
|
}
|
||||||
s = skip_whitespace(s);
|
/* space split */
|
||||||
if (!*s) break;
|
while (*s) {
|
||||||
n++;
|
s = skip_whitespace(s);
|
||||||
while (*s && !isspace(*s))
|
if (!*s) break;
|
||||||
*s1++ = *s++;
|
n++;
|
||||||
*s1++ = '\0';
|
while (*s && !isspace(*s))
|
||||||
}
|
*s1++ = *s++;
|
||||||
|
*s1++ = '\0';
|
||||||
}
|
}
|
||||||
return n;
|
return n;
|
||||||
}
|
}
|
||||||
|
|
||||||
static void split_f0(void)
|
static void split_f0(void)
|
||||||
{
|
{
|
||||||
|
/* static char *fstrings; */
|
||||||
#define fstrings (G.split_f0__fstrings)
|
#define fstrings (G.split_f0__fstrings)
|
||||||
|
|
||||||
int i, n;
|
int i, n;
|
||||||
|
Loading…
x
Reference in New Issue
Block a user