2 3940506b 2005-01-13 devnull * sed -- stream editor
6 3940506b 2005-01-13 devnull #include <u.h>
7 3940506b 2005-01-13 devnull #include <libc.h>
8 3940506b 2005-01-13 devnull #include <bio.h>
9 3940506b 2005-01-13 devnull #include <regexp.h>
12 3940506b 2005-01-13 devnull DEPTH = 20, /* max nesting depth of {} */
13 3940506b 2005-01-13 devnull MAXCMDS = 512, /* max sed commands */
14 3940506b 2005-01-13 devnull ADDSIZE = 10000, /* size of add & read buffer */
15 3940506b 2005-01-13 devnull MAXADDS = 20, /* max pending adds and reads */
16 3940506b 2005-01-13 devnull LBSIZE = 8192, /* input line size */
17 3940506b 2005-01-13 devnull LABSIZE = 50, /* max label name size */
18 3940506b 2005-01-13 devnull MAXSUB = 10, /* max number of sub reg exp */
19 3940506b 2005-01-13 devnull MAXFILES = 120, /* max output files */
21 3940506b 2005-01-13 devnull /* An address is a line #, a R.E., "$", a reference to the last
22 3940506b 2005-01-13 devnull * R.E., or nothing.
24 3940506b 2005-01-13 devnull typedef struct {
33 3940506b 2005-01-13 devnull long line; /* Line # */
34 3940506b 2005-01-13 devnull Reprog *rp; /* Compiled R.E. */
38 3940506b 2005-01-13 devnull typedef struct SEDCOM {
39 3940506b 2005-01-13 devnull Addr ad1; /* optional start address */
40 3940506b 2005-01-13 devnull Addr ad2; /* optional end address */
42 3940506b 2005-01-13 devnull Reprog *re1; /* compiled R.E. */
43 3940506b 2005-01-13 devnull Rune *text; /* added text or file name */
44 3940506b 2005-01-13 devnull struct SEDCOM *lb1; /* destination command of branch */
46 3940506b 2005-01-13 devnull Rune *rhs; /* Right-hand side of substitution */
47 3940506b 2005-01-13 devnull Biobuf* fcode; /* File ID for read and write */
48 3940506b 2005-01-13 devnull char command; /* command code -see below */
49 3940506b 2005-01-13 devnull char gfl; /* 'Global' flag for substitutions */
50 3940506b 2005-01-13 devnull char pfl; /* 'print' flag for substitutions */
51 3940506b 2005-01-13 devnull char active; /* 1 => data between start and end */
52 3940506b 2005-01-13 devnull char negfl; /* negation flag */
53 3940506b 2005-01-13 devnull } SedCom;
55 3940506b 2005-01-13 devnull /* Command Codes for field SedCom.command */
56 3940506b 2005-01-13 devnull #define ACOM 01
57 3940506b 2005-01-13 devnull #define BCOM 020
58 3940506b 2005-01-13 devnull #define CCOM 02
59 3940506b 2005-01-13 devnull #define CDCOM 025
60 3940506b 2005-01-13 devnull #define CNCOM 022
61 3940506b 2005-01-13 devnull #define COCOM 017
62 3940506b 2005-01-13 devnull #define CPCOM 023
63 3940506b 2005-01-13 devnull #define DCOM 03
64 3940506b 2005-01-13 devnull #define ECOM 015
65 3940506b 2005-01-13 devnull #define EQCOM 013
66 3940506b 2005-01-13 devnull #define FCOM 016
67 3940506b 2005-01-13 devnull #define GCOM 027
68 3940506b 2005-01-13 devnull #define CGCOM 030
69 3940506b 2005-01-13 devnull #define HCOM 031
70 3940506b 2005-01-13 devnull #define CHCOM 032
71 3940506b 2005-01-13 devnull #define ICOM 04
72 3940506b 2005-01-13 devnull #define LCOM 05
73 3940506b 2005-01-13 devnull #define NCOM 012
74 3940506b 2005-01-13 devnull #define PCOM 010
75 3940506b 2005-01-13 devnull #define QCOM 011
76 3940506b 2005-01-13 devnull #define RCOM 06
77 3940506b 2005-01-13 devnull #define SCOM 07
78 3940506b 2005-01-13 devnull #define TCOM 021
79 3940506b 2005-01-13 devnull #define WCOM 014
80 3940506b 2005-01-13 devnull #define CWCOM 024
81 3940506b 2005-01-13 devnull #define YCOM 026
82 3940506b 2005-01-13 devnull #define XCOM 033
85 3940506b 2005-01-13 devnull typedef struct label { /* Label symbol table */
86 3940506b 2005-01-13 devnull Rune asc[9]; /* Label name */
87 3940506b 2005-01-13 devnull SedCom *chain;
88 3940506b 2005-01-13 devnull SedCom *address; /* Command associated with label */
91 3940506b 2005-01-13 devnull typedef struct FILE_CACHE { /* Data file control block */
92 3940506b 2005-01-13 devnull struct FILE_CACHE *next; /* Forward Link */
93 3940506b 2005-01-13 devnull char *name; /* Name of file */
94 3940506b 2005-01-13 devnull } FileCache;
96 3940506b 2005-01-13 devnull SedCom pspace[MAXCMDS]; /* Command storage */
97 3940506b 2005-01-13 devnull SedCom *pend = pspace+MAXCMDS; /* End of command storage */
98 3940506b 2005-01-13 devnull SedCom *rep = pspace; /* Current fill point */
100 3940506b 2005-01-13 devnull Reprog *lastre = 0; /* Last regular expression */
101 3940506b 2005-01-13 devnull Resub subexp[MAXSUB]; /* sub-patterns of pattern match*/
103 3940506b 2005-01-13 devnull Rune addspace[ADDSIZE]; /* Buffer for a, c, & i commands */
104 3940506b 2005-01-13 devnull Rune *addend = addspace+ADDSIZE;
106 3940506b 2005-01-13 devnull SedCom *abuf[MAXADDS]; /* Queue of pending adds & reads */
107 3940506b 2005-01-13 devnull SedCom **aptr = abuf;
109 3940506b 2005-01-13 devnull struct { /* Sed program input control block */
110 3940506b 2005-01-13 devnull enum PTYPE /* Either on command line or in file */
111 3940506b 2005-01-13 devnull { P_ARG,
114 3940506b 2005-01-13 devnull union PCTL { /* Pointer to data */
115 3940506b 2005-01-13 devnull Biobuf *bp;
116 3940506b 2005-01-13 devnull char *curr;
120 3940506b 2005-01-13 devnull Rune genbuf[LBSIZE]; /* Miscellaneous buffer */
122 3940506b 2005-01-13 devnull FileCache *fhead = 0; /* Head of File Cache Chain */
123 3940506b 2005-01-13 devnull FileCache *ftail = 0; /* Tail of File Cache Chain */
125 3940506b 2005-01-13 devnull Rune *loc1; /* Start of pattern match */
126 3940506b 2005-01-13 devnull Rune *loc2; /* End of pattern match */
127 3940506b 2005-01-13 devnull Rune seof; /* Pattern delimiter char */
129 3940506b 2005-01-13 devnull Rune linebuf[LBSIZE+1]; /* Input data buffer */
130 3940506b 2005-01-13 devnull Rune *lbend = linebuf+LBSIZE; /* End of buffer */
131 3940506b 2005-01-13 devnull Rune *spend = linebuf; /* End of input data */
132 3940506b 2005-01-13 devnull Rune *cp; /* Current scan point in linebuf */
134 3940506b 2005-01-13 devnull Rune holdsp[LBSIZE+1]; /* Hold buffer */
135 3940506b 2005-01-13 devnull Rune *hend = holdsp+LBSIZE; /* End of hold buffer */
136 3940506b 2005-01-13 devnull Rune *hspend = holdsp; /* End of hold data */
138 3940506b 2005-01-13 devnull int nflag; /* Command line flags */
139 3940506b 2005-01-13 devnull int gflag;
141 3940506b 2005-01-13 devnull int dolflag; /* Set when at true EOF */
142 3940506b 2005-01-13 devnull int sflag; /* Set when substitution done */
143 3940506b 2005-01-13 devnull int jflag; /* Set when jump required */
144 3940506b 2005-01-13 devnull int delflag; /* Delete current line when set */
146 3940506b 2005-01-13 devnull long lnum = 0; /* Input line count */
148 3940506b 2005-01-13 devnull char fname[MAXFILES][40]; /* File name cache */
149 3940506b 2005-01-13 devnull Biobuf *fcode[MAXFILES]; /* File ID cache */
150 3940506b 2005-01-13 devnull int nfiles = 0; /* Cache fill point */
152 3940506b 2005-01-13 devnull Biobuf fout; /* Output stream */
153 3940506b 2005-01-13 devnull Biobuf bstdin; /* Default input */
154 3940506b 2005-01-13 devnull Biobuf* f = 0; /* Input data */
156 3940506b 2005-01-13 devnull Label ltab[LABSIZE]; /* Label name symbol table */
157 3940506b 2005-01-13 devnull Label *labend = ltab+LABSIZE; /* End of label table */
158 3940506b 2005-01-13 devnull Label *lab = ltab+1; /* Current Fill point */
160 3940506b 2005-01-13 devnull int depth = 0; /* {} stack pointer */
162 3940506b 2005-01-13 devnull Rune bad; /* Dummy err ptr reference */
163 3940506b 2005-01-13 devnull Rune *badp = &bad;
166 3940506b 2005-01-13 devnull char CGMES[] = "Command garbled: %S";
167 3940506b 2005-01-13 devnull char TMMES[] = "Too much text: %S";
168 3940506b 2005-01-13 devnull char LTL[] = "Label too long: %S";
169 3940506b 2005-01-13 devnull char AD0MES[] = "No addresses allowed: %S";
170 3940506b 2005-01-13 devnull char AD1MES[] = "Only one address allowed: %S";
172 3940506b 2005-01-13 devnull void address(Addr *);
173 3940506b 2005-01-13 devnull void arout(void);
174 3940506b 2005-01-13 devnull int cmp(char *, char *);
175 3940506b 2005-01-13 devnull int rcmp(Rune *, Rune *);
176 3940506b 2005-01-13 devnull void command(SedCom *);
177 3940506b 2005-01-13 devnull Reprog *compile(void);
178 3940506b 2005-01-13 devnull Rune *compsub(Rune *, Rune *);
179 3940506b 2005-01-13 devnull void dechain(void);
180 3940506b 2005-01-13 devnull void dosub(Rune *);
181 3940506b 2005-01-13 devnull int ecmp(Rune *, Rune *, int);
182 3940506b 2005-01-13 devnull void enroll(char *);
183 3940506b 2005-01-13 devnull void errexit(void);
184 3940506b 2005-01-13 devnull int executable(SedCom *);
185 3940506b 2005-01-13 devnull void execute(void);
186 3940506b 2005-01-13 devnull void fcomp(void);
187 3940506b 2005-01-13 devnull long getrune(void);
188 3940506b 2005-01-13 devnull Rune *gline(Rune *);
189 3940506b 2005-01-13 devnull int match(Reprog *, Rune *);
190 3940506b 2005-01-13 devnull void newfile(enum PTYPE, char *);
191 3940506b 2005-01-13 devnull int opendata(void);
192 3940506b 2005-01-13 devnull Biobuf *open_file(char *);
193 3940506b 2005-01-13 devnull Rune *place(Rune *, Rune *, Rune *);
194 3940506b 2005-01-13 devnull void quit(char *, char *);
195 3940506b 2005-01-13 devnull int rline(Rune *, Rune *);
196 3940506b 2005-01-13 devnull Label *search(Label *);
197 3940506b 2005-01-13 devnull int substitute(SedCom *);
198 3940506b 2005-01-13 devnull char *text(char *);
199 3940506b 2005-01-13 devnull Rune *stext(Rune *, Rune *);
200 3940506b 2005-01-13 devnull int ycomp(SedCom *);
201 3940506b 2005-01-13 devnull char * trans(int c);
202 3940506b 2005-01-13 devnull void putline(Biobuf *bp, Rune *buf, int n);
205 3940506b 2005-01-13 devnull main(int argc, char **argv)
207 3940506b 2005-01-13 devnull int compfl;
209 3940506b 2005-01-13 devnull lnum = 0;
210 3940506b 2005-01-13 devnull Binit(&fout, 1, OWRITE);
211 3940506b 2005-01-13 devnull fcode[nfiles++] = &fout;
212 3940506b 2005-01-13 devnull compfl = 0;
214 3940506b 2005-01-13 devnull if(argc == 1)
215 3940506b 2005-01-13 devnull exits(0);
216 3940506b 2005-01-13 devnull ARGBEGIN{
217 3940506b 2005-01-13 devnull case 'n':
218 3940506b 2005-01-13 devnull nflag++;
219 3940506b 2005-01-13 devnull continue;
220 3940506b 2005-01-13 devnull case 'f':
221 3940506b 2005-01-13 devnull if(argc <= 1)
222 3940506b 2005-01-13 devnull quit("no pattern-file", 0);
223 3940506b 2005-01-13 devnull newfile(P_FILE, ARGF());
224 3940506b 2005-01-13 devnull fcomp();
225 3940506b 2005-01-13 devnull compfl = 1;
226 3940506b 2005-01-13 devnull continue;
227 3940506b 2005-01-13 devnull case 'e':
228 3940506b 2005-01-13 devnull if (argc <= 1)
229 3940506b 2005-01-13 devnull quit("missing pattern", 0);
230 3940506b 2005-01-13 devnull newfile(P_ARG, ARGF());
231 3940506b 2005-01-13 devnull fcomp();
232 3940506b 2005-01-13 devnull compfl = 1;
233 3940506b 2005-01-13 devnull continue;
234 3940506b 2005-01-13 devnull case 'g':
235 3940506b 2005-01-13 devnull gflag++;
236 3940506b 2005-01-13 devnull continue;
237 3940506b 2005-01-13 devnull default:
238 3940506b 2005-01-13 devnull fprint(2, "sed: Unknown flag: %c\n", ARGC());
239 3940506b 2005-01-13 devnull continue;
240 3940506b 2005-01-13 devnull } ARGEND
242 3940506b 2005-01-13 devnull if(compfl == 0) {
243 3940506b 2005-01-13 devnull if (--argc < 0)
244 3940506b 2005-01-13 devnull quit("missing pattern", 0);
245 3940506b 2005-01-13 devnull newfile(P_ARG, *argv++);
246 3940506b 2005-01-13 devnull fcomp();
249 3940506b 2005-01-13 devnull if(depth)
250 3940506b 2005-01-13 devnull quit("Too many {'s", 0);
252 3940506b 2005-01-13 devnull ltab[0].address = rep;
254 3940506b 2005-01-13 devnull dechain();
256 3940506b 2005-01-13 devnull if(argc <= 0)
257 3940506b 2005-01-13 devnull enroll(0); /* Add stdin to cache */
258 3940506b 2005-01-13 devnull else while(--argc >= 0) {
259 3940506b 2005-01-13 devnull enroll(*argv++);
261 3940506b 2005-01-13 devnull execute();
262 3940506b 2005-01-13 devnull exits(0);
265 3940506b 2005-01-13 devnull fcomp(void)
267 3940506b 2005-01-13 devnull Rune *tp;
268 3940506b 2005-01-13 devnull SedCom *pt, *pt1;
270 3940506b 2005-01-13 devnull Label *lpt;
272 3940506b 2005-01-13 devnull static Rune *p = addspace;
273 3940506b 2005-01-13 devnull static SedCom **cmpend[DEPTH]; /* stack of {} operations */
275 3940506b 2005-01-13 devnull while (rline(linebuf, lbend) >= 0) {
276 3940506b 2005-01-13 devnull cp = linebuf;
277 3940506b 2005-01-13 devnull comploop:
278 3940506b 2005-01-13 devnull while(*cp == ' ' || *cp == '\t')
280 3940506b 2005-01-13 devnull if(*cp == '\0' || *cp == '#')
281 3940506b 2005-01-13 devnull continue;
282 3940506b 2005-01-13 devnull if(*cp == ';') {
284 3940506b 2005-01-13 devnull goto comploop;
287 3940506b 2005-01-13 devnull address(&rep->ad1);
288 3940506b 2005-01-13 devnull if (rep->ad1.type != A_NONE) {
289 3940506b 2005-01-13 devnull if (rep->ad1.type == A_LAST) {
290 3940506b 2005-01-13 devnull if (!lastre)
291 3940506b 2005-01-13 devnull quit("First RE may not be null", 0);
292 3940506b 2005-01-13 devnull rep->ad1.type = A_RE;
293 3940506b 2005-01-13 devnull rep->ad1.u.rp = lastre;
295 3940506b 2005-01-13 devnull if(*cp == ',' || *cp == ';') {
297 3940506b 2005-01-13 devnull address(&rep->ad2);
298 3940506b 2005-01-13 devnull if (rep->ad2.type == A_LAST) {
299 3940506b 2005-01-13 devnull rep->ad1.type = A_RE;
300 3940506b 2005-01-13 devnull rep->ad2.u.rp = lastre;
303 3940506b 2005-01-13 devnull rep->ad2.type = A_NONE;
305 3940506b 2005-01-13 devnull while(*cp == ' ' || *cp == '\t')
309 3940506b 2005-01-13 devnull switch(*cp++) {
311 3940506b 2005-01-13 devnull default:
312 3940506b 2005-01-13 devnull quit("Unrecognized command: %S", (char *)linebuf);
314 3940506b 2005-01-13 devnull case '!':
315 3940506b 2005-01-13 devnull rep->negfl = 1;
316 3940506b 2005-01-13 devnull goto swit;
318 3940506b 2005-01-13 devnull case '{':
319 3940506b 2005-01-13 devnull rep->command = BCOM;
320 3940506b 2005-01-13 devnull rep->negfl = !(rep->negfl);
321 3940506b 2005-01-13 devnull cmpend[depth++] = &rep->u.lb1;
322 3940506b 2005-01-13 devnull if(++rep >= pend)
323 3940506b 2005-01-13 devnull quit("Too many commands: %S", (char *) linebuf);
324 3940506b 2005-01-13 devnull if(*cp == '\0') continue;
325 3940506b 2005-01-13 devnull goto comploop;
327 3940506b 2005-01-13 devnull case '}':
328 3940506b 2005-01-13 devnull if(rep->ad1.type != A_NONE)
329 3940506b 2005-01-13 devnull quit(AD0MES, (char *) linebuf);
330 3940506b 2005-01-13 devnull if(--depth < 0)
331 3940506b 2005-01-13 devnull quit("Too many }'s", 0);
332 3940506b 2005-01-13 devnull *cmpend[depth] = rep;
333 3940506b 2005-01-13 devnull if(*cp == 0) continue;
334 3940506b 2005-01-13 devnull goto comploop;
336 3940506b 2005-01-13 devnull case '=':
337 3940506b 2005-01-13 devnull rep->command = EQCOM;
338 3940506b 2005-01-13 devnull if(rep->ad2.type != A_NONE)
339 3940506b 2005-01-13 devnull quit(AD1MES, (char *) linebuf);
342 3940506b 2005-01-13 devnull case ':':
343 3940506b 2005-01-13 devnull if(rep->ad1.type != A_NONE)
344 3940506b 2005-01-13 devnull quit(AD0MES, (char *) linebuf);
346 3940506b 2005-01-13 devnull while(*cp == ' ')
348 3940506b 2005-01-13 devnull tp = lab->asc;
349 3940506b 2005-01-13 devnull while (*cp && *cp != ';' && *cp != ' ' && *cp != '\t' && *cp != '#') {
350 3940506b 2005-01-13 devnull *tp++ = *cp++;
351 3940506b 2005-01-13 devnull if(tp >= &(lab->asc[8]))
352 3940506b 2005-01-13 devnull quit(LTL, (char *) linebuf);
354 3940506b 2005-01-13 devnull *tp = '\0';
356 3940506b 2005-01-13 devnull if(lpt = search(lab)) {
357 3940506b 2005-01-13 devnull if(lpt->address)
358 3940506b 2005-01-13 devnull quit("Duplicate labels: %S", (char *) linebuf);
359 3940506b 2005-01-13 devnull } else {
360 3940506b 2005-01-13 devnull lab->chain = 0;
361 3940506b 2005-01-13 devnull lpt = lab;
362 3940506b 2005-01-13 devnull if(++lab >= labend)
363 3940506b 2005-01-13 devnull quit("Too many labels: %S", (char *) linebuf);
365 3940506b 2005-01-13 devnull lpt->address = rep;
366 3940506b 2005-01-13 devnull if (*cp == '#')
367 3940506b 2005-01-13 devnull continue;
368 3940506b 2005-01-13 devnull rep--; /* reuse this slot */
371 3940506b 2005-01-13 devnull case 'a':
372 3940506b 2005-01-13 devnull rep->command = ACOM;
373 3940506b 2005-01-13 devnull if(rep->ad2.type != A_NONE)
374 3940506b 2005-01-13 devnull quit(AD1MES, (char *) linebuf);
375 3940506b 2005-01-13 devnull if(*cp == '\\') cp++;
376 3940506b 2005-01-13 devnull if(*cp++ != '\n')
377 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
378 3940506b 2005-01-13 devnull rep->u.text = p;
379 3940506b 2005-01-13 devnull p = stext(p, addend);
381 3940506b 2005-01-13 devnull case 'c':
382 3940506b 2005-01-13 devnull rep->command = CCOM;
383 3940506b 2005-01-13 devnull if(*cp == '\\') cp++;
384 3940506b 2005-01-13 devnull if(*cp++ != '\n')
385 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
386 3940506b 2005-01-13 devnull rep->u.text = p;
387 3940506b 2005-01-13 devnull p = stext(p, addend);
389 3940506b 2005-01-13 devnull case 'i':
390 3940506b 2005-01-13 devnull rep->command = ICOM;
391 3940506b 2005-01-13 devnull if(rep->ad2.type != A_NONE)
392 3940506b 2005-01-13 devnull quit(AD1MES, (char *) linebuf);
393 3940506b 2005-01-13 devnull if(*cp == '\\') cp++;
394 3940506b 2005-01-13 devnull if(*cp++ != '\n')
395 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
396 3940506b 2005-01-13 devnull rep->u.text = p;
397 3940506b 2005-01-13 devnull p = stext(p, addend);
400 3940506b 2005-01-13 devnull case 'g':
401 3940506b 2005-01-13 devnull rep->command = GCOM;
404 3940506b 2005-01-13 devnull case 'G':
405 3940506b 2005-01-13 devnull rep->command = CGCOM;
408 3940506b 2005-01-13 devnull case 'h':
409 3940506b 2005-01-13 devnull rep->command = HCOM;
412 3940506b 2005-01-13 devnull case 'H':
413 3940506b 2005-01-13 devnull rep->command = CHCOM;
416 3940506b 2005-01-13 devnull case 't':
417 3940506b 2005-01-13 devnull rep->command = TCOM;
418 3940506b 2005-01-13 devnull goto jtcommon;
420 3940506b 2005-01-13 devnull case 'b':
421 3940506b 2005-01-13 devnull rep->command = BCOM;
422 3940506b 2005-01-13 devnull jtcommon:
423 3940506b 2005-01-13 devnull while(*cp == ' ')cp++;
424 3940506b 2005-01-13 devnull if(*cp == '\0') {
425 3940506b 2005-01-13 devnull if(pt = ltab[0].chain) {
426 3940506b 2005-01-13 devnull while(pt1 = pt->u.lb1)
427 3940506b 2005-01-13 devnull pt = pt1;
428 3940506b 2005-01-13 devnull pt->u.lb1 = rep;
430 3940506b 2005-01-13 devnull ltab[0].chain = rep;
433 3940506b 2005-01-13 devnull tp = lab->asc;
434 3940506b 2005-01-13 devnull while((*tp++ = *cp++))
435 3940506b 2005-01-13 devnull if(tp >= &(lab->asc[8]))
436 3940506b 2005-01-13 devnull quit(LTL, (char *) linebuf);
438 3940506b 2005-01-13 devnull tp[-1] = '\0';
440 3940506b 2005-01-13 devnull if(lpt = search(lab)) {
441 3940506b 2005-01-13 devnull if(lpt->address) {
442 3940506b 2005-01-13 devnull rep->u.lb1 = lpt->address;
443 3940506b 2005-01-13 devnull } else {
444 3940506b 2005-01-13 devnull pt = lpt->chain;
445 3940506b 2005-01-13 devnull while(pt1 = pt->u.lb1)
446 3940506b 2005-01-13 devnull pt = pt1;
447 3940506b 2005-01-13 devnull pt->u.lb1 = rep;
449 3940506b 2005-01-13 devnull } else {
450 3940506b 2005-01-13 devnull lab->chain = rep;
451 3940506b 2005-01-13 devnull lab->address = 0;
452 3940506b 2005-01-13 devnull if(++lab >= labend)
453 3940506b 2005-01-13 devnull quit("Too many labels: %S",
454 3940506b 2005-01-13 devnull (char *) linebuf);
458 3940506b 2005-01-13 devnull case 'n':
459 3940506b 2005-01-13 devnull rep->command = NCOM;
462 3940506b 2005-01-13 devnull case 'N':
463 3940506b 2005-01-13 devnull rep->command = CNCOM;
466 3940506b 2005-01-13 devnull case 'p':
467 3940506b 2005-01-13 devnull rep->command = PCOM;
470 3940506b 2005-01-13 devnull case 'P':
471 3940506b 2005-01-13 devnull rep->command = CPCOM;
474 3940506b 2005-01-13 devnull case 'r':
475 3940506b 2005-01-13 devnull rep->command = RCOM;
476 3940506b 2005-01-13 devnull if(rep->ad2.type != A_NONE)
477 3940506b 2005-01-13 devnull quit(AD1MES, (char *) linebuf);
478 3940506b 2005-01-13 devnull if(*cp++ != ' ')
479 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
480 3940506b 2005-01-13 devnull rep->u.text = p;
481 3940506b 2005-01-13 devnull p = stext(p, addend);
484 3940506b 2005-01-13 devnull case 'd':
485 3940506b 2005-01-13 devnull rep->command = DCOM;
488 3940506b 2005-01-13 devnull case 'D':
489 3940506b 2005-01-13 devnull rep->command = CDCOM;
490 3940506b 2005-01-13 devnull rep->u.lb1 = pspace;
493 3940506b 2005-01-13 devnull case 'q':
494 3940506b 2005-01-13 devnull rep->command = QCOM;
495 3940506b 2005-01-13 devnull if(rep->ad2.type != A_NONE)
496 3940506b 2005-01-13 devnull quit(AD1MES, (char *) linebuf);
499 3940506b 2005-01-13 devnull case 'l':
500 3940506b 2005-01-13 devnull rep->command = LCOM;
503 3940506b 2005-01-13 devnull case 's':
504 3940506b 2005-01-13 devnull rep->command = SCOM;
505 3940506b 2005-01-13 devnull seof = *cp++;
506 3940506b 2005-01-13 devnull if ((rep->u.re1 = compile()) == 0) {
507 3940506b 2005-01-13 devnull if(!lastre)
508 3940506b 2005-01-13 devnull quit("First RE may not be null.", 0);
509 3940506b 2005-01-13 devnull rep->u.re1 = lastre;
511 3940506b 2005-01-13 devnull rep->rhs = p;
512 3940506b 2005-01-13 devnull if((p = compsub(p, addend)) == 0)
513 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
514 3940506b 2005-01-13 devnull if(*cp == 'g') {
516 3940506b 2005-01-13 devnull rep->gfl++;
517 3940506b 2005-01-13 devnull } else if(gflag)
518 3940506b 2005-01-13 devnull rep->gfl++;
520 3940506b 2005-01-13 devnull if(*cp == 'p') {
522 3940506b 2005-01-13 devnull rep->pfl = 1;
525 3940506b 2005-01-13 devnull if(*cp == 'P') {
527 3940506b 2005-01-13 devnull rep->pfl = 2;
530 3940506b 2005-01-13 devnull if(*cp == 'w') {
532 3940506b 2005-01-13 devnull if(*cp++ != ' ')
533 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
534 3940506b 2005-01-13 devnull text(fname[nfiles]);
535 3940506b 2005-01-13 devnull for(i = nfiles - 1; i >= 0; i--)
536 3940506b 2005-01-13 devnull if(cmp(fname[nfiles],fname[i]) == 0) {
537 3940506b 2005-01-13 devnull rep->fcode = fcode[i];
538 3940506b 2005-01-13 devnull goto done;
540 3940506b 2005-01-13 devnull if(nfiles >= MAXFILES)
541 3940506b 2005-01-13 devnull quit("Too many files in w commands 1", 0);
542 3940506b 2005-01-13 devnull rep->fcode = open_file(fname[nfiles]);
546 3940506b 2005-01-13 devnull case 'w':
547 3940506b 2005-01-13 devnull rep->command = WCOM;
548 3940506b 2005-01-13 devnull if(*cp++ != ' ')
549 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
550 3940506b 2005-01-13 devnull text(fname[nfiles]);
551 3940506b 2005-01-13 devnull for(i = nfiles - 1; i >= 0; i--)
552 3940506b 2005-01-13 devnull if(cmp(fname[nfiles], fname[i]) == 0) {
553 3940506b 2005-01-13 devnull rep->fcode = fcode[i];
554 3940506b 2005-01-13 devnull goto done;
556 3940506b 2005-01-13 devnull if(nfiles >= MAXFILES){
557 3940506b 2005-01-13 devnull fprint(2, "sed: Too many files in w commands 2 \n");
558 3940506b 2005-01-13 devnull fprint(2, "nfiles = %d; MAXF = %d\n", nfiles, MAXFILES);
559 3940506b 2005-01-13 devnull errexit();
561 3940506b 2005-01-13 devnull rep->fcode = open_file(fname[nfiles]);
564 3940506b 2005-01-13 devnull case 'x':
565 3940506b 2005-01-13 devnull rep->command = XCOM;
568 3940506b 2005-01-13 devnull case 'y':
569 3940506b 2005-01-13 devnull rep->command = YCOM;
570 3940506b 2005-01-13 devnull seof = *cp++;
571 3940506b 2005-01-13 devnull if (ycomp(rep) == 0)
572 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
577 3940506b 2005-01-13 devnull if(++rep >= pend)
578 3940506b 2005-01-13 devnull quit("Too many commands, last: %S", (char *) linebuf);
580 3940506b 2005-01-13 devnull if(*cp++ != '\0') {
581 3940506b 2005-01-13 devnull if(cp[-1] == ';')
582 3940506b 2005-01-13 devnull goto comploop;
583 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
589 3940506b 2005-01-13 devnull Biobuf *
590 3940506b 2005-01-13 devnull open_file(char *name)
592 3940506b 2005-01-13 devnull Biobuf *bp;
595 3940506b 2005-01-13 devnull if ((bp = malloc(sizeof(Biobuf))) == 0)
596 3940506b 2005-01-13 devnull quit("Out of memory", 0);
597 3940506b 2005-01-13 devnull if ((fd = open(name, OWRITE)) < 0 &&
598 3940506b 2005-01-13 devnull (fd = create(name, OWRITE, 0666)) < 0)
599 3940506b 2005-01-13 devnull quit("Cannot create %s", name);
600 3940506b 2005-01-13 devnull Binit(bp, fd, OWRITE);
601 3940506b 2005-01-13 devnull Bseek(bp, 0, 2);
602 3940506b 2005-01-13 devnull fcode[nfiles++] = bp;
603 3940506b 2005-01-13 devnull return bp;
607 3940506b 2005-01-13 devnull compsub(Rune *rhs, Rune *end)
611 3940506b 2005-01-13 devnull while ((r = *cp++) != '\0') {
612 3940506b 2005-01-13 devnull if(r == '\\') {
613 3940506b 2005-01-13 devnull if (rhs < end)
614 3940506b 2005-01-13 devnull *rhs++ = 0xFFFF;
616 3940506b 2005-01-13 devnull return 0;
617 3940506b 2005-01-13 devnull r = *cp++;
618 3940506b 2005-01-13 devnull if(r == 'n')
619 3940506b 2005-01-13 devnull r = '\n';
620 3940506b 2005-01-13 devnull } else {
621 3940506b 2005-01-13 devnull if(r == seof) {
622 3940506b 2005-01-13 devnull if (rhs < end)
623 3940506b 2005-01-13 devnull *rhs++ = '\0';
625 3940506b 2005-01-13 devnull return 0;
626 3940506b 2005-01-13 devnull return rhs;
629 3940506b 2005-01-13 devnull if (rhs < end)
630 3940506b 2005-01-13 devnull *rhs++ = r;
632 3940506b 2005-01-13 devnull return 0;
635 3940506b 2005-01-13 devnull return 0;
638 3940506b 2005-01-13 devnull Reprog *
639 3940506b 2005-01-13 devnull compile(void)
642 3940506b 2005-01-13 devnull char *ep;
643 3940506b 2005-01-13 devnull char expbuf[512];
645 3940506b 2005-01-13 devnull if((c = *cp++) == seof) /* '//' */
646 3940506b 2005-01-13 devnull return 0;
647 3940506b 2005-01-13 devnull ep = expbuf;
649 3940506b 2005-01-13 devnull if (c == 0 || c == '\n')
650 3940506b 2005-01-13 devnull quit(TMMES, (char *) linebuf);
651 3940506b 2005-01-13 devnull if (c == '\\') {
652 3940506b 2005-01-13 devnull if (ep >= expbuf+sizeof(expbuf))
653 3940506b 2005-01-13 devnull quit(TMMES, (char *) linebuf);
654 3940506b 2005-01-13 devnull ep += runetochar(ep, &c);
655 3940506b 2005-01-13 devnull if ((c = *cp++) == 'n')
656 3940506b 2005-01-13 devnull c = '\n';
658 3940506b 2005-01-13 devnull if (ep >= expbuf+sizeof(expbuf))
659 3940506b 2005-01-13 devnull quit(TMMES, (char *) linebuf);
660 3940506b 2005-01-13 devnull ep += runetochar(ep, &c);
661 3940506b 2005-01-13 devnull } while ((c = *cp++) != seof);
662 3940506b 2005-01-13 devnull *ep = 0;
663 3940506b 2005-01-13 devnull return lastre = regcomp(expbuf);
667 3940506b 2005-01-13 devnull regerror(char *s)
669 3940506b 2005-01-13 devnull USED(s);
670 3940506b 2005-01-13 devnull quit(CGMES, (char *) linebuf);
674 3940506b 2005-01-13 devnull newfile(enum PTYPE type, char *name)
676 3940506b 2005-01-13 devnull if (type == P_ARG)
677 3940506b 2005-01-13 devnull prog.pctl.curr = name;
678 3940506b 2005-01-13 devnull else if ((prog.pctl.bp = Bopen(name, OREAD)) == 0)
679 3940506b 2005-01-13 devnull quit("Cannot open pattern-file: %s\n", name);
680 3940506b 2005-01-13 devnull prog.type = type;
684 3940506b 2005-01-13 devnull rline(Rune *buf, Rune *end)
689 3940506b 2005-01-13 devnull while ((c = getrune()) >= 0) {
691 3940506b 2005-01-13 devnull if (r == '\\') {
692 3940506b 2005-01-13 devnull if (buf <= end)
693 3940506b 2005-01-13 devnull *buf++ = r;
694 3940506b 2005-01-13 devnull if ((c = getrune()) < 0)
697 3940506b 2005-01-13 devnull } else if (r == '\n') {
698 3940506b 2005-01-13 devnull *buf = '\0';
699 3940506b 2005-01-13 devnull return(1);
701 3940506b 2005-01-13 devnull if (buf <= end)
702 3940506b 2005-01-13 devnull *buf++ = r;
704 3940506b 2005-01-13 devnull *buf = '\0';
705 3940506b 2005-01-13 devnull return(-1);
709 3940506b 2005-01-13 devnull getrune(void)
711 3940506b 2005-01-13 devnull char *p;
715 3940506b 2005-01-13 devnull if (prog.type == P_ARG) {
716 3940506b 2005-01-13 devnull if ((p = prog.pctl.curr) != 0) {
717 3940506b 2005-01-13 devnull if (*p) {
718 3940506b 2005-01-13 devnull prog.pctl.curr += chartorune(&r, p);
720 3940506b 2005-01-13 devnull } else {
721 3940506b 2005-01-13 devnull c = '\n'; /* fake an end-of-line */
722 3940506b 2005-01-13 devnull prog.pctl.curr = 0;
726 3940506b 2005-01-13 devnull } else if ((c = Bgetrune(prog.pctl.bp)) < 0)
727 3940506b 2005-01-13 devnull Bterm(prog.pctl.bp);
728 3940506b 2005-01-13 devnull return c;
732 3940506b 2005-01-13 devnull address(Addr *ap)
735 3940506b 2005-01-13 devnull long lno;
737 3940506b 2005-01-13 devnull if((c = *cp++) == '$')
738 3940506b 2005-01-13 devnull ap->type = A_DOL;
739 3940506b 2005-01-13 devnull else if(c == '/') {
740 3940506b 2005-01-13 devnull seof = c;
741 3940506b 2005-01-13 devnull if (ap->u.rp = compile())
742 3940506b 2005-01-13 devnull ap->type = A_RE;
744 3940506b 2005-01-13 devnull ap->type = A_LAST;
746 3940506b 2005-01-13 devnull else if (c >= '0' && c <= '9') {
747 3940506b 2005-01-13 devnull lno = c-'0';
748 3940506b 2005-01-13 devnull while ((c = *cp) >= '0' && c <= '9')
749 3940506b 2005-01-13 devnull lno = lno*10 + *cp++-'0';
750 3940506b 2005-01-13 devnull if(!lno)
751 3940506b 2005-01-13 devnull quit("line number 0 is illegal",0);
752 3940506b 2005-01-13 devnull ap->type = A_LINE;
753 3940506b 2005-01-13 devnull ap->u.line = lno;
757 3940506b 2005-01-13 devnull ap->type = A_NONE;
762 3940506b 2005-01-13 devnull cmp(char *a, char *b) /* compare characters */
764 3940506b 2005-01-13 devnull while(*a == *b++)
765 3940506b 2005-01-13 devnull if (*a == '\0')
766 3940506b 2005-01-13 devnull return(0);
767 3940506b 2005-01-13 devnull else a++;
768 3940506b 2005-01-13 devnull return(1);
772 3940506b 2005-01-13 devnull rcmp(Rune *a, Rune *b) /* compare runes */
774 3940506b 2005-01-13 devnull while(*a == *b++)
775 3940506b 2005-01-13 devnull if (*a == '\0')
776 3940506b 2005-01-13 devnull return(0);
777 3940506b 2005-01-13 devnull else a++;
778 3940506b 2005-01-13 devnull return(1);
782 3940506b 2005-01-13 devnull text(char *p) /* extract character string */
786 3940506b 2005-01-13 devnull while(*cp == '\t' || *cp == ' ')
788 3940506b 2005-01-13 devnull while (*cp) {
789 3940506b 2005-01-13 devnull if ((r = *cp++) == '\\')
790 3940506b 2005-01-13 devnull if ((r = *cp++) == 0)
792 3940506b 2005-01-13 devnull if (r == '\n')
793 3940506b 2005-01-13 devnull while (*cp == '\t' || *cp == ' ')
795 3940506b 2005-01-13 devnull p += runetochar(p, &r);
797 3940506b 2005-01-13 devnull *p++ = '\0';
798 3940506b 2005-01-13 devnull return p;
802 3940506b 2005-01-13 devnull stext(Rune *p, Rune *end) /* extract rune string */
804 3940506b 2005-01-13 devnull while(*cp == '\t' || *cp == ' ')
806 3940506b 2005-01-13 devnull while (*cp) {
807 3940506b 2005-01-13 devnull if (*cp == '\\')
808 3940506b 2005-01-13 devnull if (*++cp == 0)
810 3940506b 2005-01-13 devnull if (p >= end-1)
811 3940506b 2005-01-13 devnull quit(TMMES, (char *) linebuf);
812 3940506b 2005-01-13 devnull if ((*p++ = *cp++) == '\n')
813 3940506b 2005-01-13 devnull while(*cp == '\t' || *cp == ' ')
816 3940506b 2005-01-13 devnull *p++ = 0;
817 3940506b 2005-01-13 devnull return p;
822 3940506b 2005-01-13 devnull search (Label *ptr)
824 3940506b 2005-01-13 devnull Label *rp;
826 3940506b 2005-01-13 devnull for (rp = ltab; rp < ptr; rp++)
827 3940506b 2005-01-13 devnull if(rcmp(rp->asc, ptr->asc) == 0)
828 3940506b 2005-01-13 devnull return(rp);
829 3940506b 2005-01-13 devnull return(0);
833 3940506b 2005-01-13 devnull dechain(void)
835 3940506b 2005-01-13 devnull Label *lptr;
836 3940506b 2005-01-13 devnull SedCom *rptr, *trptr;
838 3940506b 2005-01-13 devnull for(lptr = ltab; lptr < lab; lptr++) {
840 3940506b 2005-01-13 devnull if(lptr->address == 0)
841 3940506b 2005-01-13 devnull quit("Undefined label: %S", (char *) lptr->asc);
843 3940506b 2005-01-13 devnull if(lptr->chain) {
844 3940506b 2005-01-13 devnull rptr = lptr->chain;
845 3940506b 2005-01-13 devnull while(trptr = rptr->u.lb1) {
846 3940506b 2005-01-13 devnull rptr->u.lb1 = lptr->address;
847 3940506b 2005-01-13 devnull rptr = trptr;
849 3940506b 2005-01-13 devnull rptr->u.lb1 = lptr->address;
855 3940506b 2005-01-13 devnull ycomp(SedCom *r)
858 3940506b 2005-01-13 devnull Rune *rp;
859 3940506b 2005-01-13 devnull Rune c, *tsp, highc;
860 3940506b 2005-01-13 devnull Rune *sp;
862 3940506b 2005-01-13 devnull highc = 0;
863 3940506b 2005-01-13 devnull for(tsp = cp; *tsp != seof; tsp++) {
864 3940506b 2005-01-13 devnull if(*tsp == '\\')
866 3940506b 2005-01-13 devnull if(*tsp == '\n' || *tsp == '\0')
867 3940506b 2005-01-13 devnull return(0);
868 3940506b 2005-01-13 devnull if (*tsp > highc) highc = *tsp;
871 3940506b 2005-01-13 devnull if ((rp = r->u.text = (Rune *) malloc(sizeof(Rune)*(highc+2))) == 0)
872 3940506b 2005-01-13 devnull quit("Out of memory", 0);
873 3940506b 2005-01-13 devnull *rp++ = highc; /* save upper bound */
874 3940506b 2005-01-13 devnull for (i = 0; i <= highc; i++)
875 3940506b 2005-01-13 devnull rp[i] = i;
876 3940506b 2005-01-13 devnull sp = cp;
877 3940506b 2005-01-13 devnull while((c = *sp++) != seof) {
878 3940506b 2005-01-13 devnull if(c == '\\' && *sp == 'n') {
880 3940506b 2005-01-13 devnull c = '\n';
882 3940506b 2005-01-13 devnull if((rp[c] = *tsp++) == '\\' && *tsp == 'n') {
883 3940506b 2005-01-13 devnull rp[c] = '\n';
886 3940506b 2005-01-13 devnull if(rp[c] == seof || rp[c] == '\0') {
887 3940506b 2005-01-13 devnull free(r->u.re1);
888 3940506b 2005-01-13 devnull r->u.re1 = 0;
889 3940506b 2005-01-13 devnull return(0);
892 3940506b 2005-01-13 devnull if(*tsp != seof) {
893 3940506b 2005-01-13 devnull free(r->u.re1);
894 3940506b 2005-01-13 devnull r->u.re1 = 0;
895 3940506b 2005-01-13 devnull return(0);
897 3940506b 2005-01-13 devnull cp = tsp+1;
898 3940506b 2005-01-13 devnull return(1);
902 3940506b 2005-01-13 devnull execute(void)
904 3940506b 2005-01-13 devnull SedCom *ipc;
906 3940506b 2005-01-13 devnull while (spend = gline(linebuf)){
907 3940506b 2005-01-13 devnull for(ipc = pspace; ipc->command; ) {
908 3940506b 2005-01-13 devnull if (!executable(ipc)) {
910 3940506b 2005-01-13 devnull continue;
912 3940506b 2005-01-13 devnull command(ipc);
914 3940506b 2005-01-13 devnull if(delflag)
916 3940506b 2005-01-13 devnull if(jflag) {
917 3940506b 2005-01-13 devnull jflag = 0;
918 3940506b 2005-01-13 devnull if((ipc = ipc->u.lb1) == 0)
924 3940506b 2005-01-13 devnull if(!nflag && !delflag)
925 3940506b 2005-01-13 devnull putline(&fout, linebuf, spend-linebuf);
926 3940506b 2005-01-13 devnull if(aptr > abuf) {
927 3940506b 2005-01-13 devnull arout();
929 3940506b 2005-01-13 devnull delflag = 0;
932 3940506b 2005-01-13 devnull /* determine if a statement should be applied to an input line */
934 3940506b 2005-01-13 devnull executable(SedCom *ipc)
936 3940506b 2005-01-13 devnull if (ipc->active) { /* Addr1 satisfied - accept until Addr2 */
937 3940506b 2005-01-13 devnull if (ipc->active == 1) /* Second line */
938 3940506b 2005-01-13 devnull ipc->active = 2;
939 3940506b 2005-01-13 devnull switch(ipc->ad2.type) {
940 3940506b 2005-01-13 devnull case A_NONE: /* No second addr; use first */
941 3940506b 2005-01-13 devnull ipc->active = 0;
943 3940506b 2005-01-13 devnull case A_DOL: /* Accept everything */
944 3940506b 2005-01-13 devnull return !ipc->negfl;
945 3940506b 2005-01-13 devnull case A_LINE: /* Line at end of range? */
946 3940506b 2005-01-13 devnull if (lnum <= ipc->ad2.u.line) {
947 3940506b 2005-01-13 devnull if (ipc->ad2.u.line == lnum)
948 3940506b 2005-01-13 devnull ipc->active = 0;
949 3940506b 2005-01-13 devnull return !ipc->negfl;
951 3940506b 2005-01-13 devnull ipc->active = 0; /* out of range */
952 3940506b 2005-01-13 devnull return ipc->negfl;
953 3940506b 2005-01-13 devnull case A_RE: /* Check for matching R.E. */
954 3940506b 2005-01-13 devnull if (match(ipc->ad2.u.rp, linebuf))
955 3940506b 2005-01-13 devnull ipc->active = 0;
956 3940506b 2005-01-13 devnull return !ipc->negfl;
957 3940506b 2005-01-13 devnull default: /* internal error */
958 3940506b 2005-01-13 devnull quit("Internal error", 0);
961 3940506b 2005-01-13 devnull switch (ipc->ad1.type) { /* Check first address */
962 3940506b 2005-01-13 devnull case A_NONE: /* Everything matches */
963 3940506b 2005-01-13 devnull return !ipc->negfl;
964 3940506b 2005-01-13 devnull case A_DOL: /* Only last line */
965 3940506b 2005-01-13 devnull if (dolflag)
966 3940506b 2005-01-13 devnull return !ipc->negfl;
968 3940506b 2005-01-13 devnull case A_LINE: /* Check line number */
969 3940506b 2005-01-13 devnull if (ipc->ad1.u.line == lnum) {
970 3940506b 2005-01-13 devnull ipc->active = 1; /* In range */
971 3940506b 2005-01-13 devnull return !ipc->negfl;
974 3940506b 2005-01-13 devnull case A_RE: /* Check R.E. */
975 3940506b 2005-01-13 devnull if (match(ipc->ad1.u.rp, linebuf)) {
976 3940506b 2005-01-13 devnull ipc->active = 1; /* In range */
977 3940506b 2005-01-13 devnull return !ipc->negfl;
980 3940506b 2005-01-13 devnull default:
981 3940506b 2005-01-13 devnull quit("Internal error", 0);
983 3940506b 2005-01-13 devnull return ipc->negfl;
987 3940506b 2005-01-13 devnull match(Reprog *pattern, Rune *buf)
989 3940506b 2005-01-13 devnull if (!pattern)
990 3940506b 2005-01-13 devnull return 0;
991 3940506b 2005-01-13 devnull subexp[0].s.rsp = buf;
992 3940506b 2005-01-13 devnull subexp[0].e.rep = 0;
993 3940506b 2005-01-13 devnull if (rregexec(pattern, linebuf, subexp, MAXSUB)) {
994 3940506b 2005-01-13 devnull loc1 = subexp[0].s.rsp;
995 3940506b 2005-01-13 devnull loc2 = subexp[0].e.rep;
996 3940506b 2005-01-13 devnull return 1;
998 3940506b 2005-01-13 devnull loc1 = loc2 = 0;
999 3940506b 2005-01-13 devnull return 0;
1003 3940506b 2005-01-13 devnull substitute(SedCom *ipc)
1005 3940506b 2005-01-13 devnull int len;
1007 3940506b 2005-01-13 devnull if(!match(ipc->u.re1, linebuf))
1008 3940506b 2005-01-13 devnull return 0;
1011 3940506b 2005-01-13 devnull * we have at least one match. some patterns, e.g. '$' or '^', can
1012 3940506b 2005-01-13 devnull * produce zero-length matches, so during a global substitute we
1013 3940506b 2005-01-13 devnull * must bump to the character after a zero-length match to keep from looping.
1015 3940506b 2005-01-13 devnull sflag = 1;
1016 3940506b 2005-01-13 devnull if(ipc->gfl == 0) /* single substitution */
1017 3940506b 2005-01-13 devnull dosub(ipc->rhs);
1019 3940506b 2005-01-13 devnull do{ /* global substitution */
1020 3940506b 2005-01-13 devnull len = loc2-loc1; /* length of match */
1021 3940506b 2005-01-13 devnull dosub(ipc->rhs); /* dosub moves loc2 */
1022 3940506b 2005-01-13 devnull if(*loc2 == 0) /* end of string */
1024 3940506b 2005-01-13 devnull if(len == 0) /* zero-length R.E. match */
1025 3940506b 2005-01-13 devnull loc2++; /* bump over zero-length match */
1026 3940506b 2005-01-13 devnull if(*loc2 == 0) /* end of string */
1028 3940506b 2005-01-13 devnull } while(match(ipc->u.re1, loc2));
1029 3940506b 2005-01-13 devnull return 1;
1033 3940506b 2005-01-13 devnull dosub(Rune *rhsbuf)
1035 3940506b 2005-01-13 devnull Rune *lp, *sp;
1036 3940506b 2005-01-13 devnull Rune *rp;
1037 3940506b 2005-01-13 devnull int c, n;
1039 3940506b 2005-01-13 devnull lp = linebuf;
1040 3940506b 2005-01-13 devnull sp = genbuf;
1041 3940506b 2005-01-13 devnull rp = rhsbuf;
1042 3940506b 2005-01-13 devnull while (lp < loc1)
1043 3940506b 2005-01-13 devnull *sp++ = *lp++;
1044 3940506b 2005-01-13 devnull while(c = *rp++) {
1045 3940506b 2005-01-13 devnull if (c == '&') {
1046 3940506b 2005-01-13 devnull sp = place(sp, loc1, loc2);
1047 3940506b 2005-01-13 devnull continue;
1049 3940506b 2005-01-13 devnull if (c == 0xFFFF && (c = *rp++) >= '1' && c < MAXSUB+'0') {
1050 3940506b 2005-01-13 devnull n = c-'0';
1051 3940506b 2005-01-13 devnull if (subexp[n].s.rsp && subexp[n].e.rep) {
1052 3940506b 2005-01-13 devnull sp = place(sp, subexp[n].s.rsp, subexp[n].e.rep);
1053 3940506b 2005-01-13 devnull continue;
1056 3940506b 2005-01-13 devnull fprint(2, "sed: Invalid back reference \\%d\n",n);
1057 3940506b 2005-01-13 devnull errexit();
1060 3940506b 2005-01-13 devnull *sp++ = c;
1061 3940506b 2005-01-13 devnull if (sp >= &genbuf[LBSIZE])
1062 3940506b 2005-01-13 devnull fprint(2, "sed: Output line too long.\n");
1064 3940506b 2005-01-13 devnull lp = loc2;
1065 3940506b 2005-01-13 devnull loc2 = sp - genbuf + linebuf;
1066 3940506b 2005-01-13 devnull while (*sp++ = *lp++)
1067 3940506b 2005-01-13 devnull if (sp >= &genbuf[LBSIZE])
1068 3940506b 2005-01-13 devnull fprint(2, "sed: Output line too long.\n");
1069 3940506b 2005-01-13 devnull lp = linebuf;
1070 3940506b 2005-01-13 devnull sp = genbuf;
1071 3940506b 2005-01-13 devnull while (*lp++ = *sp++)
1073 3940506b 2005-01-13 devnull spend = lp-1;
1077 3940506b 2005-01-13 devnull place(Rune *sp, Rune *l1, Rune *l2)
1079 3940506b 2005-01-13 devnull while (l1 < l2) {
1080 3940506b 2005-01-13 devnull *sp++ = *l1++;
1081 3940506b 2005-01-13 devnull if (sp >= &genbuf[LBSIZE])
1082 3940506b 2005-01-13 devnull fprint(2, "sed: Output line too long.\n");
1084 3940506b 2005-01-13 devnull return(sp);
/*
 * trans -- printable spelling of a rune for the l command.
 *
 * Backspace, newline, carriage return, tab and backslash map to their
 * two-character C escapes.  Anything else is rendered as \x followed by
 * the low 16 bits of c as four lower-case hex digits.  The hex form is
 * built in a static buffer, so it is overwritten by the next call.
 */
char *
trans(int c)
{
	static char buf[] = "\\x0000";
	static char hex[] = "0123456789abcdef";
	int i, shift;

	if(c == '\b')
		return "\\b";
	if(c == '\n')
		return "\\n";
	if(c == '\r')
		return "\\r";
	if(c == '\t')
		return "\\t";
	if(c == '\\')
		return "\\\\";

	/* most significant nibble first, into buf[2..5] */
	for(i = 2, shift = 12; shift >= 0; i++, shift -= 4)
		buf[i] = hex[(c>>shift)&0xF];
	return buf;
}
/*
 * command -- carry out one compiled command, ipc, on the current line.
 *
 * The pattern space is linebuf with spend at its terminating NUL; the
 * hold space is holdsp with hspend at its NUL.  Commands communicate
 * with the main loop through globals: delflag (stop this cycle and
 * suppress the automatic print), jflag (a branch is requested) and
 * sflag (a substitution has succeeded on this line).
 */
1113 3940506b 2005-01-13 devnull command(SedCom *ipc)
1115 3940506b 2005-01-13 devnull int i, c;
1116 3940506b 2005-01-13 devnull Rune *p1, *p2;
1117 3940506b 2005-01-13 devnull char *ucp;
1118 3940506b 2005-01-13 devnull Rune *rp;
1119 3940506b 2005-01-13 devnull Rune *execp;
1121 3940506b 2005-01-13 devnull switch(ipc->command) {
/* ACOM: queue this command on the abuf list for arout; the list is kept zero-terminated */
/* NOTE(review): quit already prints a sed: prefix and a newline, so this message carries both twice; lnum is also passed through a char* parameter for %ld - confirm */
1123 3940506b 2005-01-13 devnull case ACOM:
1124 3940506b 2005-01-13 devnull *aptr++ = ipc;
1125 3940506b 2005-01-13 devnull if(aptr >= abuf+MAXADDS) {
1126 3940506b 2005-01-13 devnull quit("sed: Too many appends after line %ld\n",
1127 3940506b 2005-01-13 devnull (char *) lnum);
1129 3940506b 2005-01-13 devnull *aptr = 0;
/* CCOM: delete the pattern space; the replacement text is written only when active is 1 */
1131 3940506b 2005-01-13 devnull case CCOM:
1132 3940506b 2005-01-13 devnull delflag = 1;
1133 3940506b 2005-01-13 devnull if(ipc->active == 1) {
1134 3940506b 2005-01-13 devnull for(rp = ipc->u.text; *rp; rp++)
1135 3940506b 2005-01-13 devnull Bputrune(&fout, *rp);
1136 3940506b 2005-01-13 devnull Bputc(&fout, '\n');
/* DCOM: mark the pattern space as deleted */
1139 3940506b 2005-01-13 devnull case DCOM:
1140 3940506b 2005-01-13 devnull delflag++;
/* CDCOM: look for the first newline in the pattern space; with none, behave as a delete and return */
1142 3940506b 2005-01-13 devnull case CDCOM:
1143 3940506b 2005-01-13 devnull p1 = p2 = linebuf;
1144 3940506b 2005-01-13 devnull while(*p1 != '\n') {
1145 3940506b 2005-01-13 devnull if(*p1++ == 0) {
1146 3940506b 2005-01-13 devnull delflag++;
1147 3940506b 2005-01-13 devnull return;
/* slide the remaining text down to the start of linebuf, fix spend, and request a jump */
1151 3940506b 2005-01-13 devnull while(*p2++ = *p1++)
1153 3940506b 2005-01-13 devnull spend = p2-1;
1154 3940506b 2005-01-13 devnull jflag++;
/* EQCOM: print the current line number */
1156 3940506b 2005-01-13 devnull case EQCOM:
1157 3940506b 2005-01-13 devnull Bprint(&fout, "%ld\n", lnum);
/* GCOM: overwrite the pattern space with the hold space */
1159 3940506b 2005-01-13 devnull case GCOM:
1160 3940506b 2005-01-13 devnull p1 = linebuf;
1161 3940506b 2005-01-13 devnull p2 = holdsp;
1162 3940506b 2005-01-13 devnull while(*p1++ = *p2++)
1164 3940506b 2005-01-13 devnull spend = p1-1;
/* CGCOM: append a newline and then the hold space to the pattern space, testing against lbend */
1166 3940506b 2005-01-13 devnull case CGCOM:
1167 3940506b 2005-01-13 devnull *spend++ = '\n';
1168 3940506b 2005-01-13 devnull p1 = spend;
1169 3940506b 2005-01-13 devnull p2 = holdsp;
1170 3940506b 2005-01-13 devnull while(*p1++ = *p2++)
1171 3940506b 2005-01-13 devnull if(p1 >= lbend)
1173 3940506b 2005-01-13 devnull spend = p1-1;
/* HCOM: overwrite the hold space with the pattern space */
1175 3940506b 2005-01-13 devnull case HCOM:
1176 3940506b 2005-01-13 devnull p1 = holdsp;
1177 3940506b 2005-01-13 devnull p2 = linebuf;
1178 3940506b 2005-01-13 devnull while(*p1++ = *p2++);
1179 3940506b 2005-01-13 devnull hspend = p1-1;
/* CHCOM: append a newline and then the pattern space to the hold space, testing against hend */
1181 3940506b 2005-01-13 devnull case CHCOM:
1182 3940506b 2005-01-13 devnull *hspend++ = '\n';
1183 3940506b 2005-01-13 devnull p1 = hspend;
1184 3940506b 2005-01-13 devnull p2 = linebuf;
1185 3940506b 2005-01-13 devnull while(*p1++ = *p2++)
1186 3940506b 2005-01-13 devnull if(p1 >= hend)
1188 3940506b 2005-01-13 devnull hspend = p1-1;
/* ICOM: write the command text followed by a newline immediately */
1190 3940506b 2005-01-13 devnull case ICOM:
1191 3940506b 2005-01-13 devnull for(rp = ipc->u.text; *rp; rp++)
1192 3940506b 2005-01-13 devnull Bputrune(&fout, *rp);
1193 3940506b 2005-01-13 devnull Bputc(&fout, '\n');
/* BCOM: request a jump; the main loop follows u.lb1 */
1195 3940506b 2005-01-13 devnull case BCOM:
1196 3940506b 2005-01-13 devnull jflag = 1;
/* LCOM: list the pattern space unambiguously; i counts characters written on the current output line */
1198 3940506b 2005-01-13 devnull case LCOM:
1200 3940506b 2005-01-13 devnull for (i = 0, rp = linebuf; *rp; rp++) {
1201 3940506b 2005-01-13 devnull c = *rp;
/* printable ASCII other than backslash is written as is */
1202 3940506b 2005-01-13 devnull if(c >= 0x20 && c < 0x7F && c != '\\') {
1203 3940506b 2005-01-13 devnull Bputc(&fout, c);
/* fold long output with a backslash followed by a newline */
1204 3940506b 2005-01-13 devnull if(i++ > 71) {
1205 3940506b 2005-01-13 devnull Bprint(&fout, "\\\n");
/* everything else is written in the escaped form produced by trans */
1208 3940506b 2005-01-13 devnull } else {
1209 3940506b 2005-01-13 devnull for (ucp = trans(*rp); *ucp; ucp++){
1210 3940506b 2005-01-13 devnull c = *ucp;
1211 3940506b 2005-01-13 devnull Bputc(&fout, c);
1212 3940506b 2005-01-13 devnull if(i++ > 71) {
1213 3940506b 2005-01-13 devnull Bprint(&fout, "\\\n");
/* when the last character written was a space, add a visible backslash-n marker before the real newline */
1219 3940506b 2005-01-13 devnull if(c == ' ')
1220 3940506b 2005-01-13 devnull Bprint(&fout, "\\n");
1221 3940506b 2005-01-13 devnull Bputc(&fout, '\n');
/* NCOM: print the pattern space unless nflag, flush queued appends, then read the next line into linebuf */
1223 3940506b 2005-01-13 devnull case NCOM:
1224 3940506b 2005-01-13 devnull if(!nflag)
1225 3940506b 2005-01-13 devnull putline(&fout, linebuf, spend-linebuf);
1227 3940506b 2005-01-13 devnull if(aptr > abuf)
1228 3940506b 2005-01-13 devnull arout();
/* no more input: set delflag */
1229 3940506b 2005-01-13 devnull if((execp = gline(linebuf)) == 0) {
1230 3940506b 2005-01-13 devnull delflag = 1;
1233 3940506b 2005-01-13 devnull spend = execp;
/* CNCOM: flush queued appends, then append a newline and the next input line to the pattern space */
1235 3940506b 2005-01-13 devnull case CNCOM:
1236 3940506b 2005-01-13 devnull if(aptr > abuf)
1237 3940506b 2005-01-13 devnull arout();
1238 3940506b 2005-01-13 devnull *spend++ = '\n';
1239 3940506b 2005-01-13 devnull if((execp = gline(spend)) == 0) {
1240 3940506b 2005-01-13 devnull delflag = 1;
1243 3940506b 2005-01-13 devnull spend = execp;
/* PCOM: print the whole pattern space */
1245 3940506b 2005-01-13 devnull case PCOM:
1246 3940506b 2005-01-13 devnull putline(&fout, linebuf, spend-linebuf);
/* CPCOM: print the pattern space up to, but not including, its first newline */
1248 3940506b 2005-01-13 devnull case CPCOM:
1250 3940506b 2005-01-13 devnull for(rp = linebuf; *rp && *rp != '\n'; rp++)
1251 3940506b 2005-01-13 devnull Bputc(&fout, *rp);
1252 3940506b 2005-01-13 devnull Bputc(&fout, '\n');
/* QCOM: print the pattern space unless nflag, flush queued appends, and exit successfully */
1254 3940506b 2005-01-13 devnull case QCOM:
1255 3940506b 2005-01-13 devnull if(!nflag)
1256 3940506b 2005-01-13 devnull putline(&fout, linebuf, spend-linebuf);
1257 3940506b 2005-01-13 devnull if(aptr > abuf)
1258 3940506b 2005-01-13 devnull arout();
1259 3940506b 2005-01-13 devnull exits(0);
/* RCOM: queue this command on the abuf list, as ACOM does; arout copies the named file out later */
/* NOTE(review): same doubled prefix and newline, and same lnum cast, as in the ACOM message - confirm */
1260 3940506b 2005-01-13 devnull case RCOM:
1261 3940506b 2005-01-13 devnull *aptr++ = ipc;
1262 3940506b 2005-01-13 devnull if(aptr >= &abuf[MAXADDS])
1263 3940506b 2005-01-13 devnull quit("sed: Too many reads after line %ld\n",
1264 3940506b 2005-01-13 devnull (char *) lnum);
1265 3940506b 2005-01-13 devnull *aptr = 0;
/* SCOM: substitute; on success honour the print flag (pfl of 1 prints the whole pattern space, cpcom is the other print path) */
1267 3940506b 2005-01-13 devnull case SCOM:
1268 3940506b 2005-01-13 devnull i = substitute(ipc);
1269 3940506b 2005-01-13 devnull if(i && ipc->pfl)
1270 3940506b 2005-01-13 devnull if(ipc->pfl == 1)
1271 3940506b 2005-01-13 devnull putline(&fout, linebuf, spend-linebuf);
1273 3940506b 2005-01-13 devnull goto cpcom;
/* on success with an output file attached, continue at wcom */
1274 3940506b 2005-01-13 devnull if(i && ipc->fcode)
1275 3940506b 2005-01-13 devnull goto wcom;
/* TCOM: do nothing unless a substitution has succeeded (sflag); otherwise clear sflag and request a jump */
1278 3940506b 2005-01-13 devnull case TCOM:
1279 3940506b 2005-01-13 devnull if(sflag == 0) break;
1280 3940506b 2005-01-13 devnull sflag = 0;
1281 3940506b 2005-01-13 devnull jflag = 1;
/* WCOM: write the pattern space to the file attached to this command */
1285 3940506b 2005-01-13 devnull case WCOM:
1286 3940506b 2005-01-13 devnull putline(ipc->fcode,linebuf, spend-linebuf);
/* XCOM: exchange pattern and hold spaces, using genbuf as the temporary copy */
1288 3940506b 2005-01-13 devnull case XCOM:
1289 3940506b 2005-01-13 devnull p1 = linebuf;
1290 3940506b 2005-01-13 devnull p2 = genbuf;
1291 3940506b 2005-01-13 devnull while(*p2++ = *p1++);
1292 3940506b 2005-01-13 devnull p1 = holdsp;
1293 3940506b 2005-01-13 devnull p2 = linebuf;
1294 3940506b 2005-01-13 devnull while(*p2++ = *p1++);
1295 3940506b 2005-01-13 devnull spend = p2 - 1;
1296 3940506b 2005-01-13 devnull p1 = genbuf;
1297 3940506b 2005-01-13 devnull p2 = holdsp;
1298 3940506b 2005-01-13 devnull while(*p2++ = *p1++);
1299 3940506b 2005-01-13 devnull hspend = p2 - 1;
/* YCOM: the first rune of the table is its upper bound; runes at or below it are replaced through the table */
1301 3940506b 2005-01-13 devnull case YCOM:
1302 3940506b 2005-01-13 devnull p1 = linebuf;
1303 3940506b 2005-01-13 devnull p2 = ipc->u.text;
1304 3940506b 2005-01-13 devnull for (i = *p2++; *p1; p1++){
1305 3940506b 2005-01-13 devnull if (*p1 <= i) *p1 = p2[*p1];
1313 3940506b 2005-01-13 devnull putline(Biobuf *bp, Rune *buf, int n)
1315 3940506b 2005-01-13 devnull while (n--)
1316 3940506b 2005-01-13 devnull Bputrune(bp, *buf++);
1317 3940506b 2005-01-13 devnull Bputc(bp, '\n');
1321 3940506b 2005-01-13 devnull ecmp(Rune *a, Rune *b, int count)
1323 3940506b 2005-01-13 devnull while(count--)
1324 3940506b 2005-01-13 devnull if(*a++ != *b++) return(0);
1325 3940506b 2005-01-13 devnull return(1);
1329 3940506b 2005-01-13 devnull arout(void)
1331 3940506b 2005-01-13 devnull Rune *p1;
1332 3940506b 2005-01-13 devnull Biobuf *fi;
1334 3940506b 2005-01-13 devnull char *s;
1335 3940506b 2005-01-13 devnull char buf[128];
1337 3940506b 2005-01-13 devnull for (aptr = abuf; *aptr; aptr++) {
1338 3940506b 2005-01-13 devnull if((*aptr)->command == ACOM) {
1339 3940506b 2005-01-13 devnull for(p1 = (*aptr)->u.text; *p1; p1++ )
1340 3940506b 2005-01-13 devnull Bputrune(&fout, *p1);
1341 3940506b 2005-01-13 devnull Bputc(&fout, '\n');
1342 3940506b 2005-01-13 devnull } else {
1343 3940506b 2005-01-13 devnull for(s = buf, p1= (*aptr)->u.text; *p1; p1++)
1344 3940506b 2005-01-13 devnull s += runetochar(s, p1);
1345 3940506b 2005-01-13 devnull *s = '\0';
1346 3940506b 2005-01-13 devnull if((fi = Bopen(buf, OREAD)) == 0)
1347 3940506b 2005-01-13 devnull continue;
1348 3940506b 2005-01-13 devnull while((c = Bgetc(fi)) >= 0)
1349 3940506b 2005-01-13 devnull Bputc(&fout, c);
1350 3940506b 2005-01-13 devnull Bterm(fi);
1353 3940506b 2005-01-13 devnull aptr = abuf;
1354 3940506b 2005-01-13 devnull *aptr = 0;
/*
 * errexit -- terminate the program with the exit status string "error".
 */
void
errexit(void)
{
	exits("error");
}
/*
 * quit -- report a fatal error and exit.
 *
 * Writes "sed: ", then msg formatted with arg as its single argument,
 * then a newline, all to file descriptor 2, and calls errexit.
 * msg is used as a print format, so it must not come from user input.
 */
void
quit (char *msg, char *arg)
{
	enum { Errfd = 2 };

	fprint(Errfd, "sed: ");
	fprint(Errfd, msg, arg);
	fprint(Errfd, "\n");
	errexit();
}
/*
 * gline -- read the next input line into the buffer starting at addr.
 *
 * Returns a pointer to the NUL stored after the last rune of the line
 * (the newline itself is not stored), or 0 when no input is left.
 * Each call clears sflag and increments lnum before reading.
 * dolflag is set when the line returned is the last one of the current
 * file and no further files are queued (fhead is 0).
 */
1373 3940506b 2005-01-13 devnull gline(Rune *addr)
1375 3940506b 2005-01-13 devnull long c;
1376 3940506b 2005-01-13 devnull Rune *p;
/* one rune of lookahead kept between calls: 0 means none, negative means end of file was seen */
1378 3940506b 2005-01-13 devnull static long peekc = 0;
/* open the first input on the first call; give up if there is none */
1380 3940506b 2005-01-13 devnull if (f == 0 && opendata() < 0)
1381 3940506b 2005-01-13 devnull return 0;
1382 3940506b 2005-01-13 devnull sflag = 0;
1383 3940506b 2005-01-13 devnull lnum++;
1384 3940506b 2005-01-13 devnull /* Bflush(&fout);********* dumped 4/30/92 - bobf****/
1386 3940506b 2005-01-13 devnull p = addr;
/* start with the saved lookahead rune when there is one */
1387 3940506b 2005-01-13 devnull for (c = (peekc ? peekc : Bgetrune(f)); c >= 0; c = Bgetrune(f)) {
1388 3940506b 2005-01-13 devnull if (c == '\n') {
/* read one rune ahead so that the last line of the input can be recognised now */
1389 3940506b 2005-01-13 devnull if ((peekc = Bgetrune(f)) < 0) {
1390 3940506b 2005-01-13 devnull if (fhead == 0)
1391 3940506b 2005-01-13 devnull dolflag = 1;
1393 3940506b 2005-01-13 devnull *p = '\0';
1394 3940506b 2005-01-13 devnull return p;
/* NUL runes are dropped, and so is anything that would go past lbend */
1396 3940506b 2005-01-13 devnull if (c && p < lbend)
1397 3940506b 2005-01-13 devnull *p++ = c;
1399 3940506b 2005-01-13 devnull /* return partial final line, adding implicit newline */
1400 3940506b 2005-01-13 devnull if(p != addr) {
1401 3940506b 2005-01-13 devnull *p = '\0';
/* remember end of file so the next call moves straight on to the next input */
1402 3940506b 2005-01-13 devnull peekc = -1;
1403 3940506b 2005-01-13 devnull if (fhead == 0)
1404 3940506b 2005-01-13 devnull dolflag = 1;
1405 3940506b 2005-01-13 devnull return p;
/* current input is exhausted: forget the lookahead and close it */
1407 3940506b 2005-01-13 devnull peekc = 0;
1408 3940506b 2005-01-13 devnull Bterm(f);
1409 3940506b 2005-01-13 devnull } while (opendata() > 0); /* Switch to next stream */
1411 3940506b 2005-01-13 devnull return 0;
1414 3940506b 2005-01-13 devnull /* Data file input section - the intent is to transparently
1415 3940506b 2005-01-13 devnull * catenate all data input streams.
1418 3940506b 2005-01-13 devnull enroll(char *filename) /* Add a file to the input file cache */
1420 3940506b 2005-01-13 devnull FileCache *fp;
1422 3940506b 2005-01-13 devnull if ((fp = (FileCache *) malloc(sizeof (FileCache))) == 0)
1423 3940506b 2005-01-13 devnull quit("Out of memory", 0);
1424 3940506b 2005-01-13 devnull if (ftail == 0)
1425 3940506b 2005-01-13 devnull fhead = fp;
1427 3940506b 2005-01-13 devnull ftail->next = fp;
1428 3940506b 2005-01-13 devnull ftail = fp;
1429 3940506b 2005-01-13 devnull fp->next = 0;
1430 3940506b 2005-01-13 devnull fp->name = filename; /* 0 => stdin */
1434 3940506b 2005-01-13 devnull opendata(void)
1436 3940506b 2005-01-13 devnull if (fhead == 0)
1437 3940506b 2005-01-13 devnull return -1;
1438 3940506b 2005-01-13 devnull if (fhead->name) {
1439 3940506b 2005-01-13 devnull if ((f = Bopen(fhead->name, OREAD)) == 0)
1440 3940506b 2005-01-13 devnull quit("Can't open %s", fhead->name);
1441 3940506b 2005-01-13 devnull } else {
1442 3940506b 2005-01-13 devnull Binit(&bstdin, 0, OREAD);
1443 3940506b 2005-01-13 devnull f = &bstdin;
1445 3940506b 2005-01-13 devnull fhead = fhead->next;
1446 3940506b 2005-01-13 devnull return 1;