sbase/uniq.c

140 lines
2.4 KiB
C
Raw Normal View History

2012-05-21 19:24:28 -04:00
/* See LICENSE file for copyright and license details. */
2015-02-14 15:02:41 -05:00
#include <ctype.h>
2012-05-21 19:24:28 -04:00
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
2013-03-05 15:35:55 -05:00
2012-05-21 19:24:28 -04:00
#include "util.h"
/* Forward declarations for the helpers that main() and uniq() call before their definitions. */
static void uniqline(FILE *ofp, char *l);
static void uniq(FILE *fp, FILE *ofp);
static void uniqfinish(FILE *ofp);
2012-05-21 19:24:28 -04:00
/*
 * Option state, assigned while main() parses the command line.
 * Objects with static storage duration start out zero, so the integer
 * flags need no explicit initialiser.
 */
static const char *countfmt = ""; /* -c: printf format for the repeat count; "" prints nothing */
static int dflag;                 /* -d: suppress lines that occurred exactly once */
static int uflag;                 /* -u: suppress lines that occurred more than once */
static int fskip;                 /* -f: number of leading fields ignored when comparing */
static int sskip;                 /* -s: number of characters ignored after the skipped fields */
2012-05-21 19:24:28 -04:00
2014-01-20 05:47:46 -05:00
/*
 * State of the run of equal lines currently being collected by uniqline().
 * Static storage is zero-initialised, so the pointers start as NULL and
 * the counter as 0.
 */
static char *prevline;      /* heap copy of the first line of the current run, or NULL */
static char *prevoffset;    /* position inside prevline where comparison starts */
static long prevlinecount;  /* number of lines seen so far in the current run */
2012-05-21 19:24:28 -04:00
2013-06-14 14:20:47 -04:00
static void
usage(void)
{
eprintf("usage: %s [-c] [-d | -u] [-f fields] [-s chars]"
2015-02-19 09:54:09 -05:00
" [input [output]]\n", argv0);
2013-06-14 14:20:47 -04:00
}
2012-05-21 19:24:28 -04:00
int
main(int argc, char *argv[])
{
FILE *fp = stdin, *ofp = stdout;
2012-05-21 19:24:28 -04:00
2013-06-14 14:20:47 -04:00
ARGBEGIN {
case 'c':
countfmt = "%7ld ";
break;
case 'd':
dflag = 1;
2013-06-14 14:20:47 -04:00
break;
case 'u':
uflag = 1;
2013-06-14 14:20:47 -04:00
break;
case 'f':
fskip = estrtonum(EARGF(usage()), 0, INT_MAX);
break;
case 's':
sskip = estrtonum(EARGF(usage()), 0, INT_MAX);
break;
2013-06-14 14:20:47 -04:00
default:
usage();
} ARGEND;
2012-05-21 19:24:28 -04:00
if (argc == 0) {
uniq(stdin, stdout);
} else if (argc >= 1) {
if (strcmp(argv[0], "-") && !(fp = fopen(argv[0], "r")))
2013-06-14 14:20:47 -04:00
eprintf("fopen %s:", argv[0]);
if (argc == 2) {
if (strcmp(argv[1], "-") &&
!(ofp = fopen(argv[1], "w")))
eprintf("fopen %s:", argv[1]);
} else
eprintf("extra argument: %s\n", argv[2]);
uniq(fp, ofp);
if (fp != stdin)
fclose(fp);
} else
2013-06-14 14:20:47 -04:00
usage();
uniqfinish(ofp);
if (ofp != stdout)
fclose(ofp);
2012-05-21 19:24:28 -04:00
2014-10-02 18:46:04 -04:00
return 0;
2012-05-21 19:24:28 -04:00
}
/*
 * Return the position inside line `l` at which comparison should start.
 *
 * First `fskip` fields are skipped, a field being an optional run of
 * blanks followed by a run of non-blank characters.  Then up to `sskip`
 * further characters are skipped, stopping early at a newline or at the
 * terminating NUL.  The returned pointer always points into `l`.
 */
static char *
uniqskip(char *l)
{
	char *lo = l;
	int f = fskip, s = sskip;

	for (; f; --f) {
		/*
		 * <ctype.h> functions are only defined for values
		 * representable as unsigned char (or EOF); a plain char
		 * may be negative for bytes >= 0x80, hence the casts.
		 */
		while (isblank((unsigned char)*lo))
			lo++;
		while (*lo && !isblank((unsigned char)*lo))
			lo++;
	}
	for (; s && *lo && *lo != '\n'; --s, ++lo)
		;
	return lo;
}
static void
uniqline(FILE *ofp, char *l)
2012-05-21 19:24:28 -04:00
{
char *loffset = l ? uniqskip(l) : l;
int linesequel = (!l || !prevline)
2014-01-20 05:47:46 -05:00
? l == prevline
: !strcmp(loffset, prevoffset);
2012-05-21 19:24:28 -04:00
if (linesequel) {
2014-01-20 05:47:46 -05:00
++prevlinecount;
2012-05-21 19:24:28 -04:00
return;
}
if (prevline) {
if ((prevlinecount == 1 && !dflag) ||
(prevlinecount != 1 && !uflag)) {
fprintf(ofp, countfmt, prevlinecount);
fputs(prevline, ofp);
2012-05-21 19:24:28 -04:00
}
2014-01-20 05:47:46 -05:00
free(prevline);
prevline = prevoffset = NULL;
2012-05-21 19:24:28 -04:00
}
if (l) {
prevline = estrdup(l);
prevoffset = prevline + (loffset - l);
}
2014-01-20 05:47:46 -05:00
prevlinecount = 1;
2012-05-21 19:24:28 -04:00
}
/*
 * Read `fp` line by line and pass every line to uniqline(), which writes
 * the filtered result to `ofp`.  The final run of lines stays buffered
 * in uniqline() until it is called with a NULL line.
 */
static void
uniq(FILE *fp, FILE *ofp)
{
	char *buf = NULL;
	size_t size = 0;

	while (getline(&buf, &size, fp) != -1)
		uniqline(ofp, buf);

	/*
	 * getline() allocates the buffer even when it fails; uniqline()
	 * keeps its own copy of any line it remembers, so release it here.
	 */
	free(buf);
}
/*
 * Flush the last pending line to `ofp` by handing uniqline() a NULL
 * line, which it treats as end of input.
 */
static void
uniqfinish(FILE *ofp)
{
	char *eof = NULL;

	uniqline(ofp, eof);
}