386BSD 0.1 development
author William F. Jolitz <wjolitz@soda.berkeley.edu>
Fri, 26 Apr 1991 22:18:32 +0000 (14:18 -0800)
committer William F. Jolitz <wjolitz@soda.berkeley.edu>
Fri, 26 Apr 1991 22:18:32 +0000 (14:18 -0800)
Work on file usr/src/usr.bin/uniq/uniq.c

Co-Authored-By: Lynne Greer Jolitz <ljolitz@cardio.ucsf.edu>
Synthesized-from: 386BSD-0.1

usr/src/usr.bin/uniq/uniq.c [new file with mode: 0644]

diff --git a/usr/src/usr.bin/uniq/uniq.c b/usr/src/usr.bin/uniq/uniq.c
new file mode 100644 (file)
index 0000000..90cafbb
--- /dev/null
@@ -0,0 +1,216 @@
+/*
+ * Copyright (c) 1989 The Regents of the University of California.
+ * All rights reserved.
+ *
+ * This code is derived from software contributed to Berkeley by
+ * Case Larsen.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ * 3. All advertising materials mentioning features or use of this software
+ *    must display the following acknowledgement:
+ *     This product includes software developed by the University of
+ *     California, Berkeley and its contributors.
+ * 4. Neither the name of the University nor the names of its contributors
+ *    may be used to endorse or promote products derived from this software
+ *    without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ */
+
+#ifndef lint
+char copyright[] =
+"@(#) Copyright (c) 1989 The Regents of the University of California.\n\
+ All rights reserved.\n";
+#endif /* not lint */
+
+#ifndef lint
+static char sccsid[] = "@(#)uniq.c     5.2 (Berkeley) 6/1/90";
+#endif /* not lint */
+
+#include <stdio.h>
+#include <ctype.h>
+
+int cflag, dflag, uflag;               /* set by the -c, -d and -u options */
+int numchars, numfields, repeats;      /* +n and -n skip counts; extra copies seen of the current line */
+
+#define        MAXLINELEN      (2048 + 1)      /* size of each line buffer passed to fgets() */
+
+/*
+ * main --
+ *     parse the -c/-d/-u flags and the historic +chars/-fields skip
+ *     counts, open the input and output streams (stdin and stdout unless
+ *     operands name files), then compare each line with the one before
+ *     it and hand every completed run of equal lines to show().
+ */
+main (argc,argv)
+       int argc;
+       char **argv;
+{
+       extern int optind;
+       FILE *ifp, *ofp, *file();
+       int ch;
+       register char *t1, *t2;
+       char *prevline, *thisline, *malloc(), *skip();
+
+       while ((ch = getopt(argc, argv, "-cdu123456789")) != EOF)
+               switch (ch) {
+               case '-':
+                       --optind;
+                       goto done;
+               case 'c':
+                       cflag = 1;
+                       break;
+               case 'd':
+                       dflag = 1;
+                       break;
+               case 'u':
+                       uflag = 1;
+                       break;
+               /*
+                * A digit means getopt has started on a -n skip count.
+                * Back up so the argument is seen again by the +n/-n
+                * loop below, and stop option parsing.
+                */
+               case '1': case '2': case '3': case '4':
+               case '5': case '6': case '7': case '8': case '9':
+                       --optind;
+                       goto done;
+               case '?':
+               default:
+                       usage();
+       }
+
+done:  argc -= optind;
+       argv += optind;
+
+       /* -c excludes -d and -u; with no flags at all, default is -d -u */
+       if (cflag) {
+               if (dflag || uflag)
+                       usage();
+       } else if (!dflag && !uflag)
+               dflag = uflag = 1;
+
+       /*
+        * getopt cannot handle the + form, so the skip counts are parsed
+        * by hand.  Testing argc first keeps the loop from dereferencing
+        * the NULL that terminates argv once no operands remain.
+        */
+       for (; argc > 0 && (**argv == '+' || **argv == '-'); ++argv, --argc)
+               switch (**argv) {
+               case '+':
+                       if ((numchars = atoi(*argv + 1)) < 0)
+                               goto negerr;
+                       break;
+               case '-':
+                       if ((numfields = atoi(*argv + 1)) < 0) {
+negerr:                                (void)fprintf(stderr,
+                                   "uniq: negative field/char skip value.\n");
+                               usage();
+                       }
+                       break;
+               }
+
+       /* remaining operands: [input [output]]; usage() does not return */
+       switch(argc) {
+       case 0:
+               ifp = stdin;
+               ofp = stdout;
+               break;
+       case 1:
+               ifp = file(argv[0], "r");
+               ofp = stdout;
+               break;
+       case 2:
+               ifp = file(argv[0], "r");
+               ofp = file(argv[1], "w");
+               break;
+       default:
+               usage();
+       }
+
+       prevline = malloc(MAXLINELEN);
+       thisline = malloc(MAXLINELEN);
+       if (!prevline || !thisline) {
+               (void)fprintf(stderr, "uniq: out of memory.\n");
+               exit(1);
+       }
+
+       /* empty input: no line was read, so there is nothing to show */
+       if (!fgets(prevline, MAXLINELEN, ifp))
+               exit(0);
+
+       while (fgets(thisline, MAXLINELEN, ifp)) {
+               /* if requested get the chosen fields + character offsets */
+               if (numfields || numchars) {
+                       t1 = skip(thisline);
+                       t2 = skip(prevline);
+               } else {
+                       t1 = thisline;
+                       t2 = prevline;
+               }
+
+               /*
+                * if different, print the finished run and swap the two
+                * buffers so the new line becomes the previous one
+                */
+               if (strcmp(t1, t2)) {
+                       show(ofp, prevline);
+                       t1 = prevline;
+                       prevline = thisline;
+                       thisline = t1;
+                       repeats = 0;
+               }
+               else
+                       ++repeats;
+       }
+       /* the last run is still pending when the input ends */
+       show(ofp, prevline);
+       exit(0);
+}
+
+/*
+ * show --
+ *     write one line to ofp according to the flags: with -c the line is
+ *     prefixed by its occurrence count; otherwise it is written bare when
+ *     -d or -u selects it by whether it was repeated.
+ */
+show(ofp, str)
+       FILE *ofp;
+       char *str;
+{
+       int wanted;
+
+       if (cflag)
+               (void)fprintf(ofp, "%4d %s", repeats + 1, str);
+
+       /* -d selects lines that were repeated, -u lines that were not */
+       wanted = repeats ? dflag : uflag;
+       if (wanted)
+               (void)fputs(str, ofp);
+}
+
+/*
+ * skip --
+ *     return a pointer into str past the first numfields fields and then
+ *     past up to numchars further characters.  Neither step moves beyond
+ *     the terminating NUL.
+ */
+char *
+skip(str)
+       register char *str;
+{
+       register int infield, nchars, nfields;
+
+       /*
+        * A field is a run of non-space characters and is counted when
+        * the space character that ends it is seen, so the scan stops
+        * just after that character.  The cast keeps isspace() well
+        * defined for characters that are negative where char is signed.
+        */
+       for (nfields = numfields, infield = 0; nfields && *str; ++str)
+               if (isspace((unsigned char)*str)) {
+                       if (infield) {
+                               infield = 0;
+                               --nfields;
+                       }
+               } else if (!infield)
+                       infield = 1;
+
+       /* then step over at most numchars characters */
+       for (nchars = numchars; nchars-- && *str; ++str)
+               ;
+       return(str);
+}
+
+/*
+ * file --
+ *     open name with the given stdio mode.  On failure a message is
+ *     written to stderr and the program exits with status 1, so the
+ *     stream returned is never NULL.
+ */
+FILE *
+file(name, mode)
+       char *name, *mode;
+{
+       FILE *stream;
+
+       stream = fopen(name, mode);
+       if (stream == NULL) {
+               (void)fprintf(stderr, "uniq: can't open %s.\n", name);
+               exit(1);
+       }
+       return(stream);
+}
+
+/*
+ * usage --
+ *     write the command synopsis to stderr and exit with status 1.
+ */
+usage()
+{
+       (void)fputs(
+           "usage: uniq [-c | -du] [- #fields] [+ #chars] [input [output]]\n",
+           stderr);
+       exit(1);
+}