aboutsummaryrefslogtreecommitdiff
path: root/toys/posix/sed.c
blob: 15099cc61d6556cd9b91a992811ae59468d1c800 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
/* sed.c - Stream editor.
 *
 * Copyright 2012 Rob Landley <rob@landley.net>
 *
 * See http://opengroup.org/onlinepubs/9699919799/utilities/sed.c

USE_SED(NEWTOY(sed, "irne*", TOYFLAG_BIN))

config SED
  bool "sed"
  default n
  help
    usage: sed [-irn] {command | [-e command]...} [FILE...]

    Stream EDitor, transforms text by appling script of command to each line
    of input.

    -e  Add expression to the command script (if no -e, use first argument)
    -i	Modify file in place
    -n  No default output (p commands only)
    -r  Use extended regular expression syntex
*/

#define FOR_sed
#include "toys.h"
#include "lib/xregcomp.h"

GLOBALS(
  struct arg_list *scripts;
  struct double_list *commands;

  void *parsed;
)

// Digested version of what sed commands can actually tell use to do.


struct sed_command {
  // double_list compatibility (easier to create in-order)
  struct sed_command *next, *prev;

  // data string for (saicytb)
  char c, *data;
  // Regexes for s/match/data/ and /begin/,/end/command
  regex_t *match, *begin, *end;
  // For numeric ranges ala 10,20command
  long lstart, lstop;
  // Which match to replace, 0 for all. s and w commands can write to a file
  int which, outfd;
};

//  Space. Space. Gotta get past space. Spaaaaaaaace! (But not newline.)
void spaceorb(char **s)
{
  while (**s == ' ' || **s == '\t') *s++;
}

void parse_scripts(void)
{
  struct sed_command *commands = 0;
  struct arg_list *script;
  int which = 0;
  long l;

  for (script = TT.scripts; *script; script = script->next) {
    char *str = script->arg, *s;
    struct sed_command *cmd;

    which++;
    for (i=1;;) {
      if (!*str) break;

      cmd = xzalloc(sizeof(struct sed_command));

      // Identify prefix
      for (;;) {
        long l;

        spaceorb(&str);
        if (*str == '$') {
          l = -1;
          str++;
        } else if (isdigit(*str)) l = strtol(str, &str, 10);
        else if (!cmd->lstart) break;
        else goto parse_fail;

        spaceorb(&str);
        if (!cmd->lstart) {
          if (!l) goto parse_fail;
          cmd->lstart = l;
          if (*str != ',') break;
          str++;
          continue;
        }
        cmd->lstop = l;
        break;
      } else if (*str == '/') {
        printf("regex\n");
      }
      l = stridx("{bcdDgGhHlnNpPstwxyrqia= \t#:}", *str);
      if (l == -1) goto parse_fail;


    }
  }

  return;

parse_fail:
  error_exit("bad expression %d@%d: %s", which, i, script->arg+i);
}

void sed_main(void)
{
  char **files=toys.optargs;

  // If no -e, use first argument
  if (!TT.scripts) {
    if (!*files) error_exit("Need script");
    (TT.scripts=xzalloc(sizeof(struct arg_list)))->arg=*(files++);
  }


  {
    struct arg_list *test;

    for (test = TT.commands; test; test = test->next)
      dprintf(2,"command=%s\n",test->arg);
    while (*files) dprintf(2,"file=%s\n", *(files++));
  }
}