Patch from Kent Robotti to bring fdisk in sync with v2.12 final.
[oweals/busybox.git] / editors / sed.c
index 5dd5b2654596cfa438d418bbe846d30187b668bb..6beba0661893edae23b60811193dda4cbee92164 100644 (file)
@@ -68,6 +68,13 @@ typedef struct sed_cmd_s {
        regex_t *beg_match;     /* sed -e '/match/cmd' */
        regex_t *end_match;     /* sed -e '/match/,/end_match/cmd' */
 
+       int beg_line;           /* 'sed 1p'   0 == no begining line, apply commands to all lines */
+       int end_line;           /* 'sed 1,3p' 0 == no end line, use only beginning. -1 == $ */
+
+       /* inversion flag */
+       int invert;                     /* the '!' after the address */
+//     int block_cmd;  /* This command is part of a group that has a command address */
+
        /* SUBSTITUTION COMMAND SPECIFIC FIELDS */
 
        /* sed -e 's/sub_match/replace/' */
@@ -80,9 +87,6 @@ typedef struct sed_cmd_s {
        /* FILE COMMAND (r) SPECIFIC FIELDS */
        char *filename;
 
-       /* address storage */
-       int beg_line;           /* 'sed 1p'   0 == no begining line, apply commands to all lines */
-       int end_line;           /* 'sed 1,3p' 0 == no end line, use only beginning. -1 == $ */
        /* SUBSTITUTION COMMAND SPECIFIC FIELDS */
 
        unsigned int num_backrefs:4;    /* how many back references (\1..\9) */
@@ -98,9 +102,6 @@ typedef struct sed_cmd_s {
        /* the command */
        char cmd;                       /* p,d,s (add more at your leisure :-) */
 
-       /* inversion flag */
-       int invert;                     /* the '!' after the address */
-
        /* Branch commands */
        char *label;
 
@@ -124,9 +125,7 @@ static const char bad_format_in_subst[] =
 /* linked list of sed commands */
 static sed_cmd_t sed_cmd_head;
 static sed_cmd_t *sed_cmd_tail = &sed_cmd_head;
-static sed_cmd_t *block_cmd;
 
-static int in_block = 0;
 const char *const semicolon_whitespace = "; \n\r\t\v\0";
 static regex_t *previous_regex_ptr = NULL;
 
@@ -165,7 +164,7 @@ static void destroy_cmd_strs(void)
  * a backslash ('\').
  */
 static int index_of_next_unescaped_regexp_delim(const char delimiter,
-                                                                                               const char *str)
+       const char *str)
 {
        int bracket = -1;
        int escaped = 0;
@@ -174,8 +173,8 @@ static int index_of_next_unescaped_regexp_delim(const char delimiter,
 
        for (; (ch = str[idx]); idx++) {
                if (bracket != -1) {
-                       if (ch == ']' && !(bracket == idx - 1 ||
-                                                          (bracket == idx - 2 && str[idx - 1] == '^')))
+                       if (ch == ']' && !(bracket == idx - 1 || (bracket == idx - 2
+                                               && str[idx - 1] == '^')))
                                bracket = -1;
                } else if (escaped)
                        escaped = 0;
@@ -392,7 +391,7 @@ static int parse_edit_cmd(sed_cmd_t * sed_cmd, const char *editstr)
        /* store the edit line text */
        sed_cmd->editline = xmalloc(strlen(&editstr[2]) + 2);
        for (i = 2, j = 0;
-                editstr[i] != '\0' && strchr("\r\n", editstr[i]) == NULL; i++, j++) {
+               editstr[i] != '\0' && strchr("\r\n", editstr[i]) == NULL; i++, j++) {
                if ((editstr[i] == '\\') && strchr("\n\r", editstr[i + 1]) != NULL) {
                        sed_cmd->editline[j] = '\n';
                        i++;
@@ -449,7 +448,7 @@ static int parse_file_cmd(sed_cmd_t * sed_cmd, const char *filecmdstr)
 /*
  *  Process the commands arguments
  */
-static char *parse_cmd_str(sed_cmd_t *sed_cmd, char *cmdstr)
+static char *parse_cmd_str(sed_cmd_t * sed_cmd, char *cmdstr)
 {
        /* handle (s)ubstitution command */
        if (sed_cmd->cmd == 's') {
@@ -484,7 +483,7 @@ static char *parse_cmd_str(sed_cmd_t *sed_cmd, char *cmdstr)
        /* if it wasnt a single-letter command that takes no arguments
         * then it must be an invalid command.
         */
-       else if (strchr("dghnNpPqx=", sed_cmd->cmd) == 0) {
+       else if (strchr("dgGhHnNpPqx={}", sed_cmd->cmd) == 0) {
                bb_error_msg_and_die("Unsupported command %c", sed_cmd->cmd);
        }
 
@@ -512,13 +511,6 @@ static char *add_cmd(sed_cmd_t * sed_cmd, char *cmdstr)
                return (strpbrk(cmdstr, "\n\r"));
        }
 
-       /* Test for end of block */
-       if (*cmdstr == '}') {
-               in_block = 0;
-               cmdstr++;
-               return (cmdstr);
-       }
-
        /* parse the command
         * format is: [addr][,addr]cmd
         *            |----||-----||-|
@@ -536,7 +528,7 @@ static char *add_cmd(sed_cmd_t * sed_cmd, char *cmdstr)
                idx = get_address(cmdstr, &sed_cmd->end_line, &sed_cmd->end_match);
                if (idx == 0) {
                        bb_error_msg_and_die("get_address: no address found in string\n"
-                                                                "\t(you probably didn't check the string you passed me)");
+                               "\t(you probably didn't check the string you passed me)");
                }
                cmdstr += idx;
        }
@@ -571,28 +563,9 @@ static char *add_cmd(sed_cmd_t * sed_cmd, char *cmdstr)
        if (*cmdstr == '\0')
                bb_error_msg_and_die("missing command");
 
-       /* This is the start of a block of commands */
-       if (*cmdstr == '{') {
-               if (in_block != 0) {
-                       bb_error_msg_and_die("cant handle sub-blocks");
-               }
-               in_block = 1;
-               block_cmd = sed_cmd;
-
-               return (cmdstr + 1);
-       }
-
        sed_cmd->cmd = *cmdstr;
        cmdstr++;
 
-       if (in_block == 1) {
-               sed_cmd->beg_match = block_cmd->beg_match;
-               sed_cmd->end_match = block_cmd->end_match;
-               sed_cmd->beg_line = block_cmd->beg_line;
-               sed_cmd->end_line = block_cmd->end_line;
-               sed_cmd->invert = block_cmd->invert;
-       }
-
        cmdstr = parse_cmd_str(sed_cmd, cmdstr);
 
        /* Add the command to the command array */
@@ -637,8 +610,8 @@ static void load_cmd_file(char *filename)
        while ((line = bb_get_line_from_file(cmdfile)) != NULL) {
                /* if a line ends with '\' it needs the next line appended to it */
                while (((e = last_char_is(line, '\n')) != NULL)
-                          && (e > line) && (e[-1] == '\\')
-                          && ((nextline = bb_get_line_from_file(cmdfile)) != NULL)) {
+                       && (e > line) && (e[-1] == '\\')
+                       && ((nextline = bb_get_line_from_file(cmdfile)) != NULL)) {
                        line = xrealloc(line, (e - line) + 1 + strlen(nextline) + 1);
                        strcat(line, nextline);
                        free(nextline);
@@ -686,9 +659,7 @@ void pipe_putc(struct pipeline *const pipeline, char c)
 #endif
 
 static void print_subst_w_backrefs(const char *line, const char *replace,
-                                                                  regmatch_t * regmatch,
-                                                                  struct pipeline *const pipeline,
-                                                                  int matches)
+       regmatch_t * regmatch, struct pipeline *const pipeline, int matches)
 {
        int i;
 
@@ -707,7 +678,7 @@ static void print_subst_w_backrefs(const char *line, const char *replace,
                        /* print out the text held in regmatch[backref] */
                        if (backref <= matches && regmatch[backref].rm_so != -1)
                                for (j = regmatch[backref].rm_so; j < regmatch[backref].rm_eo;
-                                        j++)
+                                       j++)
                                        pipeputc(line[j]);
                }
 
@@ -723,6 +694,7 @@ static void print_subst_w_backrefs(const char *line, const char *replace,
                 * purpose...) */
                else if (replace[i] == '&') {
                        int j;
+
                        for (j = regmatch[0].rm_so; j < regmatch[0].rm_eo; j++)
                                pipeputc(line[j]);
                }
@@ -766,9 +738,9 @@ static int do_subst_command(sed_cmd_t * sed_cmd, char **line)
 
        /* and now, as long as we've got a line to try matching and if we can match
         * the search string, we make substitutions */
-       while ((*hackline || !altered) && (regexec(current_regex, hackline,
-                                                                                          sed_cmd->num_backrefs + 1,
-                                                                                          regmatch, 0) != REG_NOMATCH)) {
+       while ((*hackline || !altered)
+               && (regexec(current_regex, hackline, sed_cmd->num_backrefs + 1,
+                               regmatch, 0) != REG_NOMATCH)) {
                int i;
 
                /* print everything before the match */
@@ -776,8 +748,8 @@ static int do_subst_command(sed_cmd_t * sed_cmd, char **line)
                        pipeputc(hackline[i]);
 
                /* then print the substitution string */
-               print_subst_w_backrefs(hackline, sed_cmd->replace, regmatch,
-                                                          pipeline, sed_cmd->num_backrefs);
+               print_subst_w_backrefs(hackline, sed_cmd->replace, regmatch, pipeline,
+                       sed_cmd->num_backrefs);
 
                /* advance past the match */
                hackline += regmatch[0].rm_eo;
@@ -805,6 +777,7 @@ static int do_subst_command(sed_cmd_t * sed_cmd, char **line)
 static sed_cmd_t *branch_to(const char *label)
 {
        sed_cmd_t *sed_cmd;
+
        for (sed_cmd = sed_cmd_head.next; sed_cmd; sed_cmd = sed_cmd->next) {
                if ((sed_cmd->label) && (strcmp(sed_cmd->label, label) == 0)) {
                        break;
@@ -828,12 +801,14 @@ static void process_file(FILE * file)
        if (pattern_space == NULL) {
                return;
        }
-
        /* go through every line in the file */
        do {
                char *next_line;
                sed_cmd_t *sed_cmd;
                int substituted = 0;
+               /* This enables whole blocks of commands to be mask'ed out if the lead address doesnt match */
+               int block_mask = 1;
 
                /* Read one line in advance so we can act on the last line, the '$' address */
                next_line = bb_get_chomped_line_from_file(file);
@@ -843,34 +818,34 @@ static void process_file(FILE * file)
                force_print = 0;
 
                /* for every line, go through all the commands */
-               for (sed_cmd = sed_cmd_head.next; sed_cmd;
-                        sed_cmd = sed_cmd->next) {
+               for (sed_cmd = sed_cmd_head.next; sed_cmd; sed_cmd = sed_cmd->next) {
                        int deleted = 0;
 
                        /*
                         * entry point into sedding...
                         */
                        int matched = (
-                                                         /* no range necessary */
-                                                         (sed_cmd->beg_line == 0
-                                                          && sed_cmd->end_line == 0
-                                                          && sed_cmd->beg_match == NULL
-                                                          && sed_cmd->end_match == NULL) ||
-                                                         /* this line number is the first address we're looking for */
-                                                         (sed_cmd->beg_line
-                                                          && (sed_cmd->beg_line == linenum)) ||
-                                                         /* this line matches our first address regex */
-                                                         (sed_cmd->beg_match
-                                                          &&
-                                                          (regexec
-                                                               (sed_cmd->beg_match, pattern_space, 0, NULL,
-                                                                0) == 0)) ||
-                                                         /* we are currently within the beginning & ending address range */
-                                                         still_in_range || ((sed_cmd->beg_line == -1)
-                                                                                                && (next_line == NULL))
+                               /* no range necessary */
+                               (sed_cmd->beg_line == 0 && sed_cmd->end_line == 0
+                                       && sed_cmd->beg_match == NULL
+                                       && sed_cmd->end_match == NULL) ||
+                               /* this line number is the first address we're looking for */
+                               (sed_cmd->beg_line > 0 && (sed_cmd->beg_line == linenum)) ||
+                               /* this line matches our first address regex */
+                               (sed_cmd->beg_match
+                                       && (regexec(sed_cmd->beg_match, pattern_space, 0, NULL,
+                                                       0) == 0)) ||
+                               /* we are currently within the beginning & ending address range */
+                               still_in_range || ((sed_cmd->beg_line == -1)
+                                       && (next_line == NULL))
                                );
 
-                       if (sed_cmd->invert ^ matched) {
+                       if (sed_cmd->cmd == '{') {
+                               block_mask = block_mask & matched;
+                       }
+//                     matched &= block_mask;
+
+                       if (sed_cmd->invert ^ (matched & block_mask)) {
                                /* Update last used regex incase a blank substitute BRE is found */
                                if (sed_cmd->beg_match) {
                                        previous_regex_ptr = sed_cmd->beg_match;
@@ -927,7 +902,7 @@ static void process_file(FILE * file)
 
                                                pattern_space =
                                                        xrealloc(pattern_space,
-                                                                        strlen(pattern_space) + 2);
+                                                       strlen(pattern_space) + 2);
                                                tmp = strchr(pattern_space + offset, '\n');
                                                memmove(tmp + 1, tmp, strlen(tmp) + 1);
                                                tmp[0] = '\\';
@@ -952,8 +927,7 @@ static void process_file(FILE * file)
 #endif
                                        altered |= substituted;
                                        if (!be_quiet && altered && ((sed_cmd->next == NULL)
-                                                                                                || (sed_cmd->next->cmd !=
-                                                                                                        's'))) {
+                                                       || (sed_cmd->next->cmd != 's'))) {
                                                force_print = 1;
                                        }
 
@@ -979,10 +953,8 @@ static void process_file(FILE * file)
                                                /* multi-address case */
                                                /* - matching text */
                                                || (sed_cmd->end_match
-                                                       &&
-                                                       (regexec
-                                                        (sed_cmd->end_match, pattern_space, 0, NULL,
-                                                         0) == 0))
+                                                       && (regexec(sed_cmd->end_match, pattern_space, 0,
+                                                                       NULL, 0) == 0))
                                                /* - matching line numbers */
                                                || (sed_cmd->end_line > 0
                                                        && sed_cmd->end_line == linenum)) {
@@ -994,11 +966,17 @@ static void process_file(FILE * file)
 
                                case 'r':{
                                        FILE *outfile;
+
                                        outfile = fopen(sed_cmd->filename, "r");
                                        if (outfile) {
                                                char *line;
-                                               while ((line = bb_get_chomped_line_from_file(outfile)) != NULL) {
-                                                       pattern_space = xrealloc(pattern_space, strlen(line) + strlen(pattern_space) + 2);
+
+                                               while ((line =
+                                                               bb_get_chomped_line_from_file(outfile)) !=
+                                                       NULL) {
+                                                       pattern_space =
+                                                               xrealloc(pattern_space,
+                                                               strlen(line) + strlen(pattern_space) + 2);
                                                        strcat(pattern_space, "\n");
                                                        strcat(pattern_space, line);
                                                }
@@ -1023,8 +1001,7 @@ static void process_file(FILE * file)
                                        if (next_line) {
                                                pattern_space =
                                                        realloc(pattern_space,
-                                                                       strlen(pattern_space) +
-                                                                       strlen(next_line) + 2);
+                                                       strlen(pattern_space) + strlen(next_line) + 2);
                                                strcat(pattern_space, "\n");
                                                strcat(pattern_space, next_line);
                                                next_line = bb_get_chomped_line_from_file(file);
@@ -1057,17 +1034,36 @@ static void process_file(FILE * file)
                                        free(pattern_space);
                                        pattern_space = strdup(hold_space);
                                        break;
+                               case 'G': {     /* Append newline and hold space to pattern space */
+                                       int pattern_space_size = 0;
+                                       if (pattern_space) {
+                                               pattern_space_size = strlen(pattern_space);
+                                       }
+                                       pattern_space = xrealloc(pattern_space, pattern_space_size + strlen(hold_space) + 2);
+                                       strcat(pattern_space, "\n");
+                                       strcat(pattern_space, hold_space); 
+                                       break;
+                               }
                                case 'h':       /* Replace hold space with pattern space */
                                        free(hold_space);
                                        hold_space = strdup(pattern_space);
                                        break;
+                               case 'H': {     /* Append newline and pattern space to hold space */
+                                       int hold_space_size = 0;
+                                       if (hold_space) {
+                                               hold_space_size = strlen(hold_space);
+                                       }
+                                       hold_space = xrealloc(hold_space, hold_space_size + strlen(pattern_space) + 2);
+                                       strcat(hold_space, "\n");
+                                       strcat(hold_space, pattern_space); 
+                                       break;
+                               }
                                case 'x':{
                                        /* Swap hold and pattern space */
-                                       char *tmp;
-
-                                       tmp = pattern_space;
+                                       char *tmp = pattern_space;
                                        pattern_space = hold_space;
                                        hold_space = tmp;
+                                       break;
                                }
                                }
                        }
@@ -1077,43 +1073,31 @@ static void process_file(FILE * file)
                         */
                        if (matched) {
                                if (
-                                          /* this is a single-address command or... */
-                                          (sed_cmd->end_line == 0 && sed_cmd->end_match == NULL)
-                                          || (
-                                                         /* If only one address */
-                                                         /* we were in the middle of our address range (this
-                                                          * isn't the first time through) and.. */
-                                                         (still_in_range == 1) && (
-                                                                                                                  /* this line number is the last address we're looking for or... */
-                                                                                                                  (sed_cmd->
-                                                                                                                       end_line
-                                                                                                                       && (sed_cmd->
-                                                                                                                               end_line ==
-                                                                                                                               linenum))
-                                                                                                                  ||
-                                                                                                                  /* this line matches our last address regex */
-                                                                                                                  (sed_cmd->
-                                                                                                                       end_match
-                                                                                                                       &&
-                                                                                                                       (regexec
-                                                                                                                        (sed_cmd->
-                                                                                                                         end_match,
-                                                                                                                         pattern_space,
-                                                                                                                         0, NULL,
-                                                                                                                         0) == 0))
-                                                         )
-                                          )
-                                       ) {
+                                       /* this is a single-address command or... */
+                                       (sed_cmd->end_line == 0 && sed_cmd->end_match == NULL)
+                                       /* If only one address */
+                                       /* we were in the middle of our address range (this
+                                        * isn't the first time through) and.. */
+                                       || ((still_in_range == 1)
+                                               /* this line number is the last address we're looking for or... */
+                                               && ((sed_cmd->end_line > 0
+                                                               && (sed_cmd->end_line == linenum))
+                                                       /* this line matches our last address regex */
+                                                       || (sed_cmd->end_match
+                                                               && (regexec(sed_cmd->end_match, pattern_space,
+                                                                               0, NULL, 0) == 0))))) {
                                        /* we're out of our address range */
                                        still_in_range = 0;
-                               }
-
-                               /* didn't hit the exit? then we're still in the middle of an address range */
-                               else {
+                               } else {
+                                       /* didn't hit the exit? then we're still in the middle of an address range */
                                        still_in_range = 1;
                                }
                        }
 
+                       if (sed_cmd->cmd == '}') {
+                               block_mask = 1;
+                       }
+
                        if (deleted)
                                break;
                }