wc.c revision da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin/***********************************************************************
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* This software is part of the ast package *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* Copyright (c) 1992-2007 AT&T Knowledge Ventures *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* and is licensed under the *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* Common Public License, Version 1.0 *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* by AT&T Knowledge Ventures *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* A copy of the License is available at *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* http://www.opensource.org/licenses/cpl1.0.txt *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* (with md5 checksum 059e8cd6165cb4c31e351f2b69388fd9) *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* Information and Software Systems Research *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* AT&T Research *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* Florham Park NJ *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* Glenn Fowler <gsf@research.att.com> *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* David Korn <dgk@research.att.com> *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin* *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin***********************************************************************/
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin#pragma prototyped
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin/*
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin * David Korn
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin * AT&T Bell Laboratories
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin *
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin * count the number of bytes, words, and lines in a file
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin */
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chinstatic const char usage[] =
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[-?\n@(#)$Id: wc (AT&T Research) 2006-08-25 $\n]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chinUSAGE_LICENSE
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+NAME?wc - print the number of bytes, words, and lines in files]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+DESCRIPTION?\bwc\b reads one or more input files and, by default, "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "for each file writes a line containing the number of newlines, "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "\aword\as, and bytes contained in each file followed by the "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "file name to standard output in that order. A \aword\a is "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "defined to be a non-zero length string delimited by \bisspace\b(3) "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "characters.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+?If more than one file is specified, \bwc\b writes a total count "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "for all of the named files with \btotal\b written instead "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "of the file name.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+?By default, \bwc\b writes all three counts. Options can specified "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "so that only certain counts are written. The options \b-c\b "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "and \b-m\b are mutually exclusive.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+?If no \afile\a is given, or if the \afile\a is \b-\b, \bwc\b "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "reads from standard input and no filename is written to standard "
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "output. The start of the file is defined as the current offset.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[l:lines?List the line counts.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[w:words?List the word counts.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[c:bytes|chars:chars?List the byte counts.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[m|C:multibyte-chars?List the character counts.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[q:quiet?Suppress invalid multibyte character warnings.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[L:longest-line|max-line-length?List the longest line length.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"\n"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"\n[file ...]\n"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"\n"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+EXIT STATUS?]{"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "[+0?All files processed successfully.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin "[+>0?One or more files failed to open or could not be read.]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"}"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin"[+SEE ALSO?\bcat\b(1), \bisspace\b(3)]"
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin#include <cmd.h>
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin#include <wc.h>
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin#include <ls.h>
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin#define ERRORMAX 125
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chinstatic void printout(register Wc_t *wp, register char *name,register int mode)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin{
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_LINES)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfprintf(sfstdout," %7I*d",sizeof(wp->lines),wp->lines);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_WORDS)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfprintf(sfstdout," %7I*d",sizeof(wp->words),wp->words);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_CHARS)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfprintf(sfstdout," %7I*d",sizeof(wp->chars),wp->chars);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_LONGEST)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfprintf(sfstdout," %7I*d",sizeof(wp->chars),wp->longest);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(name)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfprintf(sfstdout," %s",name);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfputc(sfstdout,'\n');
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin}
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chinint
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chinb_wc(int argc,register char **argv, void* context)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin{
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin register char *cp;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin register int mode=0, n;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin register Wc_t *wp;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin Sfio_t *fp;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin Sfoff_t tlines=0, twords=0, tchars=0;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin struct stat statb;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin cmdinit(argc, argv, context, ERROR_CATALOG, 0);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin while (n = optget(argv,usage)) switch (n)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'c':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_CHARS;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'l':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_LINES;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'L':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_LONGEST;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'm':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'C':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_MBYTE;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'q':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_QUIET;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case 'w':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_WORDS;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case ':':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(2, "%s", opt_info.arg);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin case '?':
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(ERROR_usage(2), "%s", opt_info.arg);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin break;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin argv += opt_info.index;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if (error_info.errors)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(ERROR_usage(2), "%s", optusage(NiL));
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_MBYTE)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(mode&WC_CHARS)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(2, "-c and -C are mutually exclusive");
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= WC_CHARS;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!mbwide())
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode &= ~WC_MBYTE;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin setlocale(LC_CTYPE, "C");
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!(mode&(WC_WORDS|WC_CHARS|WC_LINES|WC_MBYTE|WC_LONGEST)))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin mode |= (WC_WORDS|WC_CHARS|WC_LINES);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!(wp = wc_init(mode)))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(3,"internal error");
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!(mode&WC_WORDS))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin memzero(wp->space, (1<<CHAR_BIT));
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wp->space['\n'] = -1;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(cp = *argv)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin argv++;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin do
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!cp || streq(cp,"-"))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin fp = sfstdin;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin else if(!(fp = sfopen(NiL,cp,"r")))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin error(ERROR_system(0),"%s: cannot open",cp);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin continue;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(cp)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin n++;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(!(mode&(WC_WORDS|WC_LINES|WC_MBYTE|WC_LONGEST)) && fstat(sffileno(fp),&statb)>=0
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin && S_ISREG(statb.st_mode))
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wp->chars = statb.st_size - lseek(sffileno(fp),0L,1);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin lseek(sffileno(fp),0L,2);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin else
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wc_count(wp, fp, cp);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(fp!=sfstdin)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin sfclose(fp);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin tchars += wp->chars;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin twords += wp->words;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin tlines += wp->lines;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin printout(wp,cp,mode);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin while(cp= *argv++);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin if(n>1)
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin {
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wp->lines = tlines;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wp->chars = tchars;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin wp->words = twords;
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin printout(wp,"total",mode);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin }
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin return(error_info.errors<ERRORMAX?error_info.errors:ERRORMAX);
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin}
da2e3ebdc1edfbc5028edf1354e7dd2fa69a7968chin