2011-05-29 20:30:44 +00:00
|
|
|
/* See LICENSE file for copyright and license details. */
|
2015-02-20 12:21:46 +00:00
|
|
|
#include <limits.h>
|
2015-02-01 00:24:03 +00:00
|
|
|
#include <stdint.h>
|
2015-03-20 17:09:23 +00:00
|
|
|
#include <stdio.h>
|
2011-05-29 20:30:44 +00:00
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
2014-11-13 17:29:30 +00:00
|
|
|
|
2011-05-29 20:30:44 +00:00
|
|
|
#include "text.h"
|
2015-03-20 17:09:23 +00:00
|
|
|
#include "utf.h"
|
2011-05-29 20:30:44 +00:00
|
|
|
#include "util.h"
|
|
|
|
|
2015-03-22 15:29:50 +00:00
|
|
|
/*
 * Option values and numbering state shared by the functions below.
 * The initialisers are the defaults; main() overwrites them from the
 * command line.
 */
static size_t startnum = 1;  /* -v: first number, also used when numbering resets */
static size_t incr     = 1;  /* -i: amount added after every numbered line */
static size_t blines   = 1;  /* -l: blank-line threshold used by type 'a' */
static size_t delimlen = 2;  /* length of delim in bytes */
static size_t seplen   = 1;  /* number of bytes of sep written after the number */
static int    width    = 6;  /* -w: field width passed to the '*' in format */
static int    pflag    = 0;  /* -p: do not reset the number on section changes */
static char   type[]   = { 'n', 't', 'n' }; /* footer, body, header */
static char  *delim    = "\\:";  /* -d: section delimiter */
static char   format[6] = "%*ld"; /* -n: printf format taking (width, number) */
static char  *sep      = "\t";   /* -s: text written between number and line */
static regex_t preg[3];      /* compiled pattern per section, for type 'p' */
|
2015-03-18 16:58:09 +00:00
|
|
|
|
|
|
|
static int
|
2016-03-10 04:40:34 +00:00
|
|
|
getsection(struct line *l, int *section)
|
2015-03-18 16:58:09 +00:00
|
|
|
{
|
2016-03-10 04:40:34 +00:00
|
|
|
size_t i;
|
2015-03-22 15:29:50 +00:00
|
|
|
int sectionchanged = 0, newsection = *section;
|
2015-03-18 16:58:09 +00:00
|
|
|
|
2016-03-10 04:40:34 +00:00
|
|
|
for (i = 0; (l->len - i) >= delimlen &&
|
|
|
|
!memcmp(l->data + i, delim, delimlen); i += delimlen) {
|
2015-03-18 16:58:09 +00:00
|
|
|
if (!sectionchanged) {
|
|
|
|
sectionchanged = 1;
|
|
|
|
newsection = 0;
|
|
|
|
} else {
|
2015-03-22 15:29:50 +00:00
|
|
|
newsection = (newsection + 1) % 3;
|
2015-03-18 16:58:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-03-10 04:40:34 +00:00
|
|
|
if (!(l->len - i) || l->data[i] == '\n')
|
2015-03-18 16:58:09 +00:00
|
|
|
*section = newsection;
|
|
|
|
else
|
|
|
|
sectionchanged = 0;
|
|
|
|
|
|
|
|
return sectionchanged;
|
|
|
|
}
|
2015-02-01 00:24:03 +00:00
|
|
|
|
2015-03-07 12:33:39 +00:00
|
|
|
static void
|
2015-03-22 15:29:50 +00:00
|
|
|
nl(const char *fname, FILE *fp)
|
2015-02-01 00:24:03 +00:00
|
|
|
{
|
2016-03-10 04:40:34 +00:00
|
|
|
static struct line line;
|
|
|
|
static size_t size;
|
|
|
|
size_t number = startnum, bl = 1;
|
|
|
|
ssize_t len;
|
2015-03-27 16:03:44 +00:00
|
|
|
int donumber, oldsection, section = 1;
|
2015-02-01 00:24:03 +00:00
|
|
|
|
2016-03-10 04:40:34 +00:00
|
|
|
while ((len = getline(&line.data, &size, fp)) > 0) {
|
|
|
|
line.len = len;
|
2015-03-10 11:49:56 +00:00
|
|
|
donumber = 0;
|
2015-03-18 16:58:09 +00:00
|
|
|
oldsection = section;
|
|
|
|
|
2016-03-10 04:40:34 +00:00
|
|
|
if (getsection(&line, §ion)) {
|
2015-03-18 16:58:09 +00:00
|
|
|
if ((section >= oldsection) && !pflag)
|
|
|
|
number = startnum;
|
|
|
|
continue;
|
|
|
|
}
|
2015-03-10 11:49:56 +00:00
|
|
|
|
2015-03-22 15:29:50 +00:00
|
|
|
switch (type[section]) {
|
|
|
|
case 't':
|
2016-03-10 04:40:34 +00:00
|
|
|
if (line.data[0] != '\n')
|
2015-03-22 15:29:50 +00:00
|
|
|
donumber = 1;
|
|
|
|
break;
|
|
|
|
case 'p':
|
2016-03-10 04:40:34 +00:00
|
|
|
if (!regexec(preg + section, line.data, 0, NULL, 0))
|
2015-03-22 15:29:50 +00:00
|
|
|
donumber = 1;
|
|
|
|
break;
|
|
|
|
case 'a':
|
2016-03-10 04:40:34 +00:00
|
|
|
if (line.data[0] == '\n' && bl < blines) {
|
2015-03-10 11:49:56 +00:00
|
|
|
++bl;
|
|
|
|
} else {
|
|
|
|
donumber = 1;
|
|
|
|
bl = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (donumber) {
|
2016-03-10 04:40:34 +00:00
|
|
|
printf(format, width, number);
|
|
|
|
fwrite(sep, 1, seplen, stdout);
|
2015-03-18 16:58:09 +00:00
|
|
|
number += incr;
|
2015-02-20 12:05:54 +00:00
|
|
|
}
|
2016-03-10 04:40:34 +00:00
|
|
|
fwrite(line.data, 1, line.len, stdout);
|
2015-02-01 00:24:03 +00:00
|
|
|
}
|
2016-03-10 04:40:34 +00:00
|
|
|
free(line.data);
|
2015-02-01 00:24:03 +00:00
|
|
|
if (ferror(fp))
|
2015-03-22 15:29:50 +00:00
|
|
|
eprintf("getline %s:", fname);
|
2015-02-01 00:24:03 +00:00
|
|
|
}
|
2011-05-29 20:30:44 +00:00
|
|
|
|
2013-06-14 18:20:47 +00:00
|
|
|
static void
|
|
|
|
usage(void)
|
|
|
|
{
|
2015-03-22 15:29:50 +00:00
|
|
|
eprintf("usage: %s [-p] [-b type] [-d delim] [-f type]\n"
|
|
|
|
" [-h type] [-i num] [-l num] [-n format]\n"
|
2015-12-21 17:36:28 +00:00
|
|
|
" [-s sep] [-v num] [-w num] [file]\n", argv0);
|
2015-03-18 16:58:09 +00:00
|
|
|
}
|
2015-03-22 15:29:50 +00:00
|
|
|
|
2015-03-18 16:58:09 +00:00
|
|
|
/*
 * Validate a numbering-type argument and return its type letter.
 *
 * type is the option argument: "a", "n", "t", or "p" immediately followed
 * by a regular expression.  For "p" the expression after the letter is
 * compiled into *preg with REG_NOSUB.  Any other first character, or an
 * empty argument, results in a call to usage().
 *
 * Note: both parameters shadow the file-scope variables of the same name.
 */
static char
getlinetype(char *type, regex_t *preg)
{
	if (type[0] == 'p')
		eregcomp(preg, type + 1, REG_NOSUB);
	/* strchr() also matches the terminating NUL, hence the explicit check */
	else if (!type[0] || !strchr("ant", type[0]))
		usage();

	return type[0];
}
|
|
|
|
|
2011-05-29 20:30:44 +00:00
|
|
|
int
|
|
|
|
main(int argc, char *argv[])
|
|
|
|
{
|
2015-04-04 21:09:06 +00:00
|
|
|
FILE *fp = NULL;
|
2016-03-10 04:40:34 +00:00
|
|
|
size_t s;
|
2015-05-24 23:33:19 +00:00
|
|
|
int ret = 0;
|
2015-03-22 15:29:50 +00:00
|
|
|
char *d, *formattype, *formatblit;
|
2011-05-29 20:30:44 +00:00
|
|
|
|
2013-06-14 18:20:47 +00:00
|
|
|
ARGBEGIN {
|
2015-03-18 16:58:09 +00:00
|
|
|
case 'd':
|
2016-03-10 04:40:34 +00:00
|
|
|
switch (utflen((d = EARGF(usage())))) {
|
2015-03-20 17:09:23 +00:00
|
|
|
case 0:
|
2016-03-10 04:40:34 +00:00
|
|
|
eprintf("empty logical page delimiter\n");
|
2015-03-20 17:09:23 +00:00
|
|
|
case 1:
|
|
|
|
s = strlen(d);
|
2015-03-22 15:29:50 +00:00
|
|
|
delim = emalloc(s + 1 + 1);
|
|
|
|
estrlcpy(delim, d, s + 1 + 1);
|
|
|
|
estrlcat(delim, ":", s + 1 + 1);
|
2015-03-20 17:09:23 +00:00
|
|
|
delimlen = s + 1;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
delim = d;
|
|
|
|
delimlen = strlen(delim);
|
|
|
|
break;
|
2015-03-18 16:58:09 +00:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 'f':
|
2015-03-22 15:29:50 +00:00
|
|
|
type[0] = getlinetype(EARGF(usage()), preg);
|
|
|
|
break;
|
|
|
|
case 'b':
|
|
|
|
type[1] = getlinetype(EARGF(usage()), preg + 1);
|
2015-03-18 16:58:09 +00:00
|
|
|
break;
|
|
|
|
case 'h':
|
2015-03-22 15:29:50 +00:00
|
|
|
type[2] = getlinetype(EARGF(usage()), preg + 2);
|
2013-06-14 18:20:47 +00:00
|
|
|
break;
|
|
|
|
case 'i':
|
2015-02-01 00:24:03 +00:00
|
|
|
incr = estrtonum(EARGF(usage()), 0, MIN(LLONG_MAX, SIZE_MAX));
|
2013-06-14 18:20:47 +00:00
|
|
|
break;
|
2015-03-10 11:49:56 +00:00
|
|
|
case 'l':
|
2015-03-22 15:29:50 +00:00
|
|
|
blines = estrtonum(EARGF(usage()), 0, MIN(LLONG_MAX, SIZE_MAX));
|
2015-03-10 11:49:56 +00:00
|
|
|
break;
|
2015-02-20 14:12:03 +00:00
|
|
|
case 'n':
|
2015-03-22 15:29:50 +00:00
|
|
|
formattype = EARGF(usage());
|
|
|
|
estrlcpy(format, "%", sizeof(format));
|
|
|
|
|
|
|
|
if (!strcmp(formattype, "ln")) {
|
|
|
|
formatblit = "-";
|
|
|
|
} else if (!strcmp(formattype, "rn")) {
|
|
|
|
formatblit = "";
|
|
|
|
} else if (!strcmp(formattype, "rz")) {
|
|
|
|
formatblit = "0";
|
|
|
|
} else {
|
|
|
|
eprintf("%s: bad format\n", formattype);
|
|
|
|
}
|
|
|
|
|
|
|
|
estrlcat(format, formatblit, sizeof(format));
|
2016-03-10 04:40:34 +00:00
|
|
|
estrlcat(format, "*ld", sizeof(format));
|
2015-02-20 14:12:03 +00:00
|
|
|
break;
|
2015-03-18 16:58:09 +00:00
|
|
|
case 'p':
|
|
|
|
pflag = 1;
|
|
|
|
break;
|
2013-06-14 18:20:47 +00:00
|
|
|
case 's':
|
|
|
|
sep = EARGF(usage());
|
2016-03-10 04:40:34 +00:00
|
|
|
seplen = unescape(sep);
|
2013-06-14 18:20:47 +00:00
|
|
|
break;
|
2015-02-20 12:05:54 +00:00
|
|
|
case 'v':
|
|
|
|
startnum = estrtonum(EARGF(usage()), 0, MIN(LLONG_MAX, SIZE_MAX));
|
|
|
|
break;
|
2015-02-20 12:15:43 +00:00
|
|
|
case 'w':
|
|
|
|
width = estrtonum(EARGF(usage()), 1, INT_MAX);
|
|
|
|
break;
|
2013-06-14 18:20:47 +00:00
|
|
|
default:
|
|
|
|
usage();
|
2015-11-01 10:16:49 +00:00
|
|
|
} ARGEND
|
2013-06-14 18:20:47 +00:00
|
|
|
|
2014-12-04 12:04:41 +00:00
|
|
|
if (argc > 1)
|
|
|
|
usage();
|
|
|
|
|
2015-03-22 15:29:50 +00:00
|
|
|
if (!argc) {
|
2014-12-04 12:00:19 +00:00
|
|
|
nl("<stdin>", stdin);
|
2014-12-04 12:04:41 +00:00
|
|
|
} else {
|
2015-05-19 15:44:15 +00:00
|
|
|
if (!strcmp(argv[0], "-")) {
|
2015-05-15 11:28:39 +00:00
|
|
|
argv[0] = "<stdin>";
|
|
|
|
fp = stdin;
|
|
|
|
} else if (!(fp = fopen(argv[0], "r"))) {
|
2014-12-04 12:04:41 +00:00
|
|
|
eprintf("fopen %s:", argv[0]);
|
2015-05-15 11:28:39 +00:00
|
|
|
}
|
2014-12-04 12:00:19 +00:00
|
|
|
nl(argv[0], fp);
|
2011-05-29 20:30:44 +00:00
|
|
|
}
|
2015-03-22 15:29:50 +00:00
|
|
|
|
2015-05-24 23:33:19 +00:00
|
|
|
ret |= fp && fp != stdin && fshut(fp, argv[0]);
|
|
|
|
ret |= fshut(stdin, "<stdin>") | fshut(stdout, "<stdout>");
|
|
|
|
|
|
|
|
return ret;
|
2011-05-29 20:30:44 +00:00
|
|
|
}
|