Fix s/[/]// handling (noted by Dumas Patrice).
[oweals/busybox.git] / editors / sed.c
index 73ed058e237fa1a2486bad4d194e74b87d7257f5..989df7cb4be609fa173e7e770db13bd26d8c7c25 100644 (file)
@@ -144,8 +144,21 @@ static void destroy_cmd_strs()
  */
 static int index_of_next_unescaped_regexp_delim(struct sed_cmd *sed_cmd, const char *str, int idx)
 {
+       int bracket = -1;
+       int escaped = 0;
+
        for ( ; str[idx]; idx++) {
-               if (str[idx] == sed_cmd->delimiter && str[idx-1] != '\\')
+               if (bracket != -1) {
+                       if (str[idx] == ']' && !(bracket == idx - 1 ||
+                                                                        (bracket == idx - 2 && str[idx-1] == '^')))
+                               bracket = -1;
+               } else if (escaped)
+                       escaped = 0;
+               else if (str[idx] == '\\')
+                       escaped = 1;
+               else if (str[idx] == '[')
+                       bracket = idx;
+               else if (str[idx] == sed_cmd->delimiter)
                        return idx;
        }
 
@@ -195,15 +208,6 @@ static int get_address(struct sed_cmd *sed_cmd, const char *str, int *linenum, r
        return idx;
 }
 
-static char *strdup_substr(const char *str, int start, int end)
-{
-       int size = end - start + 1;
-       char *newstr = xmalloc(size);
-       memcpy(newstr, str+start, size-1);
-       newstr[size-1] = '\0';
-       return newstr;
-}
-
 static int parse_subst_cmd(struct sed_cmd *sed_cmd, const char *substr)
 {
        int oldidx, cflags = REG_NEWLINE;
@@ -232,7 +236,7 @@ static int parse_subst_cmd(struct sed_cmd *sed_cmd, const char *substr)
        idx = index_of_next_unescaped_regexp_delim(sed_cmd, substr, ++idx);
        if (idx == -1)
                error_msg_and_die("bad format in substitution expression");
-       match = strdup_substr(substr, oldidx, idx);
+       match = xstrndup(substr + oldidx, idx - oldidx);
 
        /* determine the number of back references in the match string */
        /* Note: we compute this here rather than in the do_subst_command()
@@ -251,7 +255,7 @@ static int parse_subst_cmd(struct sed_cmd *sed_cmd, const char *substr)
        idx = index_of_next_unescaped_regexp_delim(sed_cmd, substr, ++idx);
        if (idx == -1)
                error_msg_and_die("bad format in substitution expression");
-       sed_cmd->replace = strdup_substr(substr, oldidx, idx);
+       sed_cmd->replace = xstrndup(substr + oldidx, idx - oldidx);
 
        /* process the flags */
        while (substr[++idx]) {
@@ -499,8 +503,23 @@ static void load_cmd_file(char *filename)
        }
 }
 
-static void print_subst_w_backrefs(const char *line, const char *replace, regmatch_t *regmatch)
+#define PIPE_MAGIC 0x7f
+#define PIPE_GROW 64  
+#define pipeputc(c) \
+{ if (pipeline[pipeline_idx] == PIPE_MAGIC) { \
+       pipeline = xrealloc(pipeline, pipeline_len+PIPE_GROW); \
+       memset(pipeline+pipeline_len, 0, PIPE_GROW); \
+       pipeline_len += PIPE_GROW; \
+       pipeline[pipeline_len-1] = PIPE_MAGIC; } \
+       pipeline[pipeline_idx++] = (c); }
+
+static void print_subst_w_backrefs(const char *line, const char *replace, 
+       regmatch_t *regmatch, char **pipeline_p, int *pipeline_idx_p, 
+       int *pipeline_len_p, int matches)
 {
+       char *pipeline = *pipeline_p;
+       int pipeline_idx = *pipeline_idx_p;
+       int pipeline_len = *pipeline_len_p;
        int i;
 
        /* go through the replacement string */
@@ -515,14 +534,15 @@ static void print_subst_w_backrefs(const char *line, const char *replace, regmat
                        tmpstr[1] = 0;
                        backref = atoi(tmpstr);
                        /* print out the text held in regmatch[backref] */
-                       for (j = regmatch[backref].rm_so; j < regmatch[backref].rm_eo; j++)
-                               fputc(line[j], stdout);
+                       if (backref <= matches && regmatch[backref].rm_so != -1)
+                               for (j = regmatch[backref].rm_so; j < regmatch[backref].rm_eo; j++)
+                                       pipeputc(line[j]);
                }
 
                /* if we find a backslash escaped character, print the character */
                else if (replace[i] == '\\') {
                        ++i;
-                       fputc(replace[i], stdout);
+                       pipeputc(replace[i]);
                }
 
                /* if we find an unescaped '&' print out the whole matched text.
@@ -532,27 +552,41 @@ static void print_subst_w_backrefs(const char *line, const char *replace, regmat
                else if (replace[i] == '&' && replace[i-1] != '\\') {
                        int j;
                        for (j = regmatch[0].rm_so; j < regmatch[0].rm_eo; j++)
-                               fputc(line[j], stdout);
+                               pipeputc(line[j]);
                }
                /* nothing special, just print this char of the replacement string to stdout */
                else
-                       fputc(replace[i], stdout);
+                       pipeputc(replace[i]);
        }
+       *pipeline_p = pipeline;
+       *pipeline_idx_p = pipeline_idx;
+       *pipeline_len_p = pipeline_len;
 }
 
-static int do_subst_command(const struct sed_cmd *sed_cmd, const char *line)
+static int do_subst_command(const struct sed_cmd *sed_cmd, char **line)
 {
-       char *hackline = (char *)line;
+       char *hackline = *line;
+       char *pipeline = 0;
+       int pipeline_idx = 0;
+       int pipeline_len = 0;
        int altered = 0;
        regmatch_t *regmatch = NULL;
 
        /* we only proceed if the substitution 'search' expression matches */
-       if (regexec(sed_cmd->sub_match, line, 0, NULL, 0) == REG_NOMATCH)
+       if (regexec(sed_cmd->sub_match, hackline, 0, NULL, 0) == REG_NOMATCH)
                return 0;
 
        /* whaddaya know, it matched. get the number of back references */
        regmatch = xmalloc(sizeof(regmatch_t) * (sed_cmd->num_backrefs+1));
 
+       /* allocate more PIPE_GROW bytes
+          if replaced string is larger than original */
+       pipeline_len = strlen(hackline)+PIPE_GROW;
+       pipeline = xmalloc(pipeline_len);
+       memset(pipeline, 0, pipeline_len);
+       /* buffer magic */
+       pipeline[pipeline_len-1] = PIPE_MAGIC;
+
        /* and now, as long as we've got a line to try matching and if we can match
         * the search string, we make substitutions */
        while (*hackline && (regexec(sed_cmd->sub_match, hackline,
@@ -561,10 +595,12 @@ static int do_subst_command(const struct sed_cmd *sed_cmd, const char *line)
 
                /* print everything before the match */
                for (i = 0; i < regmatch[0].rm_so; i++)
-                       fputc(hackline[i], stdout);
+                       pipeputc(hackline[i]);
 
                /* then print the substitution string */
-               print_subst_w_backrefs(hackline, sed_cmd->replace, regmatch);
+               print_subst_w_backrefs(hackline, sed_cmd->replace, regmatch, 
+                               &pipeline, &pipeline_idx, &pipeline_len,
+                               sed_cmd->num_backrefs);
 
                /* advance past the match */
                hackline += regmatch[0].rm_eo;
@@ -576,11 +612,14 @@ static int do_subst_command(const struct sed_cmd *sed_cmd, const char *line)
                        break;
        }
 
-       puts(hackline);
+       for (; *hackline; hackline++) pipeputc(*hackline);
+       if (pipeline[pipeline_idx] == PIPE_MAGIC) pipeline[pipeline_idx] = 0;
 
        /* cleanup */
        free(regmatch);
 
+       free(*line);
+       *line = pipeline;
        return altered;
 }
 
@@ -608,6 +647,10 @@ static void process_file(FILE *file)
                         * entry point into sedding...
                         */
                        if (
+                                       /* no range necessary */
+                                       (sed_cmds[i].beg_line == 0 && sed_cmds[i].end_line == 0 &&
+                                        sed_cmds[i].beg_match == NULL &&
+                                        sed_cmds[i].end_match == NULL) ||
                                        /* this line number is the first address we're looking for */
                                        (sed_cmds[i].beg_line && (sed_cmds[i].beg_line == linenum)) ||
                                        /* this line matches our first address regex */
@@ -655,12 +698,14 @@ static void process_file(FILE *file)
 
                                                /* we print the line once, unless we were told to be quiet */
                                                if (!be_quiet)
-                                                       altered = do_subst_command(&sed_cmds[i], line);
+                                                       altered |= do_subst_command(&sed_cmds[i], &line);
 
                                                /* we also print the line if we were given the 'p' flag
                                                 * (this is quite possibly the second printing) */
                                                if (sed_cmds[i].sub_p)
-                                                       altered = do_subst_command(&sed_cmds[i], line);
+                                                       altered |= do_subst_command(&sed_cmds[i], &line);
+                                               if (altered && (i+1 >= ncmds || sed_cmds[i+1].cmd != 's'))
+                                                       puts(line);
 
                                                break;