<?xml version="1.0" encoding="utf-8"?> <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd"> <html> <head> <meta http-equiv=Content-Type content="text/html; charset=utf8"> <title>/usr/web/sources/contrib/cross/field.c - Plan 9 from Bell Labs</title> <!-- THIS FILE IS AUTOMATICALLY GENERATED. --> <!-- EDIT sources.tr INSTEAD. --> </meta> </head> <body> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <p style="line-height: 1.2em; margin-left: 1.00in; text-indent: 0.00in; margin-right: 1.00in; margin-top: 0; margin-bottom: 0; text-align: center;"> <span style="font-size: 10pt"><a href="/plan9/">Plan 9 from Bell Labs</a>’s /usr/web/sources/contrib/cross/field.c</span></p> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <center><font size=-1> Copyright © 2009 Alcatel-Lucent.<br /> Distributed under the <a href="/plan9/license.html">Lucent Public License version 1.02</a>. <br /> <a href="/plan9/download.html">Download the Plan 9 distribution.</a> </font> </center> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <table width="100%" cellspacing=0 border=0><tr><td align="center"> <table cellspacing=0 cellpadding=5 bgcolor="#eeeeff"><tr><td align="left"> <pre> <!-- END HEADER --> #include <u.h> #include <libc.h> #include <bio.h> #include <ctype.h> #include <regexp.h> typedef struct Range Range; typedef struct Slice Slice; typedef struct Slices Slices; typedef struct Token Token; struct Range { int begin; int end; }; struct Slice { char *begin; char *end; }; #pragma varargck type "S" Slice struct Slices { uint len; uint size; Slice *slices; }; struct Token { int type; Slice slice; }; enum { NF = 0x7FFFFFFF }; Biobuf bin; Biobuf bout; int guesscollapse(const char *sep); int Sfmt(Fmt *f); Slice lex(char **sp); Slice next(char **sp); Slice peek(void); void extend(Slice *slice, char **sp); int tiseof(Slice *tok); int tisdelim(Slice *tok); int tisspace(Slice *tok); int parseranges(char *src, Range **rv); Range parserange(char **sp); int stoi(Slice slice); int parsenum(char **s); void process(Biobuf *b, int rc, Range *rv, Reprog *delim, char *sep, int collapse); void pprefix(char *prefix); uint split(char *line, Reprog *delim, Slices *ss, int collapse); void reset(Slices *ss); void append(Slices *ss, char *begin, char *end); void usage(void); void main(int argc, char *argv[]) { Range *rv; char *filename, *insep, *outsep; Reprog *delim; int rc, collapse, eflag, Eflag, oflag, zflag; insep = "[ \t\v\r]+"; outsep = " "; Binit(&bin, 0, OREAD); Binit(&bout, 1, OWRITE); fmtinstall('S', Sfmt); zflag = 0; eflag = 0; Eflag = 0; oflag = 0; ARGBEGIN { case '0': outsep = ""; zflag = 1; break; case 'e': eflag = 1; break; case 'E': Eflag = 1; break; case 'F': insep = EARGF(usage()); break; case 'O': oflag = 1; outsep = EARGF(usage()); break; default: usage(); break; } ARGEND; if (eflag && Eflag) { fprint(2, "flag conflict: -e and -E are mutually exclusive\n"); usage(); } if (oflag && zflag) { fprint(2, "flag conflict: -0 and -O are mutually exclusive\n"); usage(); } if (argc <= 0) usage(); delim = regcomp(insep); if (delim == nil) sysfatal("bad input separator regexp '%s': %r", insep); rv = nil; rc = parseranges(*argv++, &rv); if (rc < 0) sysfatal("parseranges failed"); collapse = guesscollapse(insep); if (eflag) collapse = 0; if (Eflag) collapse = 1; if (*argv == nil) { process(&bin, rc, rv, delim, outsep, collapse); } else while ((filename = *argv++) != nil) { Biobuf *b; if (strcmp(filename, "-") == 0) { process(&bin, rc, rv, delim, outsep, collapse); continue; } b = Bopen(filename, OREAD); if (b == nil) sysfatal("failure opening '%s': %r", filename); process(b, rc, rv, delim, outsep, collapse); Bterm(b); } exits(0); } int guesscollapse(const char *sep) { int len = utflen(sep); return len > 1 && (len != 2 || *sep != '\\'); } int Sfmt(Fmt *f) { Slice s = va_arg(f->args, Slice); if (s.begin == nil || s.end == nil) return 0; return fmtprint(f, "%.*s", s.end - s.begin, s.begin); } /* * The field selection syntax is: * * fields := range [[delim] fields] * range := field | NUM '-' [field] * field := NUM | 'NF' * delim := ws+ | '|' | ',' * ws := c such that `isspace(c)` is true. */ Slice lex(char **sp) { char *s; Slice slice; memset(&slice, 0, sizeof(slice)); s = *sp; slice.begin = s; while (isspace(*s)) s++; if (s == *sp) { switch (*s) { case '\0': slice.begin = nil; break; case '-': s++; break; case 'N': if (*++s == 'F') s++; break; case ',': case '|': s++; break; default: if (!isdigit(*s)) sysfatal("lexical error, c = %c", *s); while (isdigit(*s)) s++; break; } } slice.end = s; *sp = s; return slice; } Slice current; Slice peek() { return current; } Slice next(char **sp) { Slice tok = peek(); current = lex(sp); return tok; } void extend(Slice *slice, char **sp) { Slice tok = next(sp); slice->end = tok.end; } int stoi(Slice slice) { char *s; int n = 0, sign = 1; s = slice.begin; if (*s == '-') { sign = -1; s++; } for (; s != slice.end; s++) { if (!isdigit(*s)) sysfatal("stoi: bad number in '%S', c = %c", slice, *s); n = n * 10 + (*s - '0'); } return sign * n; } int tiseof(Slice *tok) { return tok == nil || tok->begin == nil; } int tisdelim(Slice *tok) { return tiseof(tok) || tisspace(tok) || *tok->begin == ',' || *tok->begin == '|'; } int tisspace(Slice *tok) { return !tiseof(tok) && isspace(*tok->begin); } int parseranges(char *src, Range **rv) { char *s; Range *rs, *t; int n, m; Slice tok; rs = nil; m = 0; n = 0; s = src; if (s == nil || *s == '\0') return -1; next(&s); do { tok = peek(); while (tisspace(&tok)) tok = next(&s); Range r = parserange(&s); if (n >= m) { m = 2*m; if (m == 0) m = 1; t = realloc(rs, sizeof(Range) * m); if (t == nil) sysfatal("realloc failed parsing ranges"); rs = t; } rs[n++] = r; tok = next(&s); if (!tisdelim(&tok)) sysfatal("syntax error in field list"); } while (!tiseof(&tok)); *rv = rs; return n; } int tokeq(Slice *tok, const char *s) { return !tiseof(tok) && !strncmp(tok->begin, s, tok->end - tok->begin); } Range parserange(char **sp) { Range range; Slice tok; range.begin = range.end = NF; tok = peek(); if (tokeq(&tok, "NF")) { next(sp); return range; } range.begin = range.end = parsenum(sp); tok = peek(); if (tokeq(&tok, "-")) { next(sp); range.end = NF; tok = peek(); if (tokeq(&tok, "NF")) { next(sp); return range; } if (!tiseof(&tok) && !tisdelim(&tok)) range.end = parsenum(sp); } return range; } int parsenum(char **sp) { Slice tok; tok = next(sp); if (tiseof(&tok)) sysfatal("EOF in number parser"); if (isdigit(*tok.begin)) return stoi(tok); if (*tok.begin != '-') sysfatal("number parse error: unexpected '%S'", tok); extend(&tok, sp); if (!isdigit(*(tok.begin + 1))) sysfatal("negative number parse error: unspected '%S'", tok); return stoi(tok); } void process(Biobuf *b, int rc, Range *rv, Reprog *delim, char *outsep, int collapse) { char *line, *prefix; const int nulldelim = 1; Slice *s; Slices ss; memset(&ss, 0, sizeof(ss)); while ((line = Brdstr(b, '\n', nulldelim)) != 0) { int printed = 0; uint nfields = split(line, delim, &ss, collapse); s = ss.slices; prefix = nil; for (int k = 0; k < rc; k++) { int begin = rv[k].begin; int end = rv[k].end; if (begin == 0) { pprefix(prefix); prefix = outsep; Bprint(&bout, "%s", line); printed = 1; begin = 1; } if (begin == NF) begin = nfields; if (begin < 0) begin += nfields + 1; begin--; if (end < 0) end += nfields + 1; if (begin < 0 || end < 0 || end < begin || nfields < begin) continue; for (int f = begin; f < end && f < nfields; f++) { pprefix(prefix); prefix = outsep; Bprint(&bout, "%S", s[f]); printed = 1; } } if (rc != 0 && (printed || !collapse)) Bputc(&bout, '\n'); free(line); } free(ss.slices); } void pprefix(char *prefix) { if (prefix == nil) return; if (*prefix == '\0') Bputc(&bout, '\0'); else Bprint(&bout, "%s", prefix); } void reset(Slices *ss) { ss->len = 0; } uint split(char *line, Reprog *delim, Slices *ss, int collapse) { char *s, *b, *e; Resub match[1]; memset(match, 0, sizeof(match)); reset(ss); b = nil; e = nil; s = line; while (regexec(delim, s, match, nelem(match))) { b = s; e = match[0].sp; s = match[0].ep; memset(match, 0, sizeof(match)); if (collapse && (e == line || b == e)) continue; append(ss, b, e); } b = s; e = b + strlen(s); if (!collapse || b != e) append(ss, b, e); return ss->len; } void append(Slices *ss, char *begin, char *end) { if (ss->len >= ss->size) { Slice *s; ss->size *= 2; if (ss->size == 0) ss->size = 1; s = realloc(ss->slices, ss->size * sizeof(Slice)); if (s == nil) sysfatal("malloc failed appending slice: %r"); ss->slices = s; } ss->slices[ss->len].begin = begin; ss->slices[ss->len++].end = end; } void usage() { sysfatal("usage: field [ -E | -e ] [ -F regexp ] [ -0 | -O delimiter ] <field list> [file...]"); } <!-- BEGIN TAIL --> </pre> </td></tr></table> </td></tr></table> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <p style="line-height: 1.2em; margin-left: 1.00in; text-indent: 0.00in; margin-right: 1.00in; margin-top: 0; margin-bottom: 0; text-align: center;"> <span style="font-size: 10pt"></span></p> <p style="margin-top: 0; margin-bottom: 0.50in"></p> <p style="margin-top: 0; margin-bottom: 0.33in"></p> <center><table border="0"><tr> <td valign="middle"><a href="http://www.alcatel-lucent.com/"><img border="0" src="/plan9/img/logo_ft.gif" alt="Bell Labs" /> </a></td> <td valign="middle"><a href="http://www.opensource.org"><img border="0" alt="OSI certified" src="/plan9/img/osi-certified-60x50.gif" /> </a></td> <td><img style="padding-right: 45px;" alt="Powered by Plan 9" src="/plan9/img/power36.gif" /> </td> </tr></table></center> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <center> <span style="font-size: 10pt">(<a href="/plan9/">Return to Plan 9 Home Page</a>)</span> </center> <p style="margin-top: 0; margin-bottom: 0.17in"></p> <center><font size=-1> <span style="font-size: 10pt"><a href="http://www.lucent.com/copyright.html">Copyright</a></span> <span style="font-size: 10pt">© 2009 Alcatel-Lucent.</span> <span style="font-size: 10pt">All Rights Reserved.</span> <br /> <span style="font-size: 10pt">Comments to</span> <span style="font-size: 10pt"><a href="mailto:webmaster@plan9.bell-labs.com">webmaster@plan9.bell-labs.com</a>.</span> </font></center> </body> </html>