+/*
+ * Copyright (c) 1980, 1987 Regents of the University of California.
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * 3. All advertising materials mentioning features or use of this software
+ * must display the following acknowledgement:
+ * This product includes software developed by the University of
+ * California, Berkeley and its contributors.
+ * 4. Neither the name of the University nor the names of its contributors
+ * may be used to endorse or promote products derived from this software
+ * without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ */
+
+#ifndef lint
+char copyright[] =
+"@(#) Copyright (c) 1980, 1987 Regents of the University of California.\n\
+ All rights reserved.\n";
+#endif /* not lint */
+
+#ifndef lint
+static char sccsid[] = "@(#)wc.c 5.7 (Berkeley) 3/2/91";
+#endif /* not lint */
+
+/* wc line, word and char count */
+
+#include <sys/param.h>
+#include <sys/stat.h>
+#include <sys/file.h>
+#include <stdio.h>
+
+#define DEL 0177 /* del char */
+#define NL 012 /* newline char */
+#define SPACE 040 /* space char */
+#define TAB 011 /* tab char */
+
+static long tlinect, twordct, tcharct;
+static int doline, doword, dochar;
+
+main(argc, argv)
+ int argc;
+ char **argv;
+{
+ extern int optind;
+ register int ch;
+ int total;
+
+ /*
+ * wc is unusual in that its flags are on by default, so,
+ * if you don't get any arguments, you have to turn them
+ * all on.
+ */
+ if (argc > 1 && argv[1][0] == '-' && argv[1][1]) {
+ while ((ch = getopt(argc, argv, "lwc")) != EOF)
+ switch((char)ch) {
+ case 'l':
+ doline = 1;
+ break;
+ case 'w':
+ doword = 1;
+ break;
+ case 'c':
+ dochar = 1;
+ break;
+ case '?':
+ default:
+ fputs("usage: wc [-lwc] [files]\n", stderr);
+ exit(1);
+ }
+ argv += optind;
+ argc -= optind;
+ }
+ else {
+ ++argv;
+ --argc;
+ doline = doword = dochar = 1;
+ }
+
+ total = 0;
+ if (!*argv) {
+ cnt((char *)NULL);
+ putchar('\n');
+ }
+ else do {
+ cnt(*argv);
+ printf(" %s\n", *argv);
+ ++total;
+ } while(*++argv);
+
+ if (total > 1) {
+ if (doline)
+ printf(" %7ld", tlinect);
+ if (doword)
+ printf(" %7ld", twordct);
+ if (dochar)
+ printf(" %7ld", tcharct);
+ puts(" total");
+ }
+ exit(0);
+}
+
+cnt(file)
+ char *file;
+{
+ register u_char *C;
+ register short gotsp;
+ register int len;
+ register long linect, wordct, charct;
+ struct stat sbuf;
+ int fd;
+ u_char buf[MAXBSIZE];
+
+ linect = wordct = charct = 0;
+ if (file) {
+ if ((fd = open(file, O_RDONLY, 0)) < 0) {
+ perror(file);
+ exit(1);
+ }
+ if (!doword) {
+ /*
+ * line counting is split out because it's a lot
+ * faster to get lines than to get words, since
+ * the word count requires some logic.
+ */
+ if (doline) {
+ while(len = read(fd, buf, MAXBSIZE)) {
+ if (len == -1) {
+ perror(file);
+ exit(1);
+ }
+ charct += len;
+ for (C = buf; len--; ++C)
+ if (*C == '\n')
+ ++linect;
+ }
+ tlinect += linect;
+ printf(" %7ld", linect);
+ if (dochar) {
+ tcharct += charct;
+ printf(" %7ld", charct);
+ }
+ close(fd);
+ return;
+ }
+ /*
+ * if all we need is the number of characters and
+ * it's a directory or a regular or linked file, just
+ * stat the puppy. We avoid testing for it not being
+ * a special device in case someone adds a new type
+ * of inode.
+ */
+ if (dochar) {
+ if (fstat(fd, &sbuf)) {
+ perror(file);
+ exit(1);
+ }
+ if (sbuf.st_mode & (S_IFREG | S_IFLNK | S_IFDIR)) {
+ printf(" %7ld", sbuf.st_size);
+ tcharct += sbuf.st_size;
+ close(fd);
+ return;
+ }
+ }
+ }
+ }
+ else
+ fd = 0;
+ /* do it the hard way... */
+ for (gotsp = 1; len = read(fd, buf, MAXBSIZE);) {
+ if (len == -1) {
+ perror(file);
+ exit(1);
+ }
+ charct += len;
+ for (C = buf; len--; ++C)
+ switch(*C) {
+ case NL:
+ ++linect;
+ case TAB:
+ case SPACE:
+ gotsp = 1;
+ continue;
+ default:
+#ifdef notdef
+ /*
+ * This line of code implements the
+ * original V7 wc algorithm, i.e.
+ * a non-printing character doesn't
+ * toggle the "word" count, so that
+ * " ^D^F " counts as 6 spaces,
+ * while "foo^D^Fbar" counts as 8
+ * characters.
+ *
+ * test order is important -- gotsp
+ * will normally be NO, so test it
+ * first
+ */
+ if (gotsp && *C > SPACE && *C < DEL) {
+#endif
+ /*
+ * This line implements the manual
+ * page, i.e. a word is a "maximal
+ * string of characters delimited by
+ * spaces, tabs or newlines." Notice
+ * nothing was said about a character
+ * being printing or non-printing.
+ */
+ if (gotsp) {
+ gotsp = 0;
+ ++wordct;
+ }
+ }
+ }
+ if (doline) {
+ tlinect += linect;
+ printf(" %7ld", linect);
+ }
+ if (doword) {
+ twordct += wordct;
+ printf(" %7ld", wordct);
+ }
+ if (dochar) {
+ tcharct += charct;
+ printf(" %7ld", charct);
+ }
+ close(fd);
+}