logresolve.c revision 17dc8282ea6b3ad1bbc661b498de9ec2e9987ede
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun/* Copyright 1999-2005 The Apache Software Foundation or its licensors, as
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * applicable.
4a56677aad9b66a36f3dc9fddbca8dc1230ad471rbowen * Licensed under the Apache License, Version 2.0 (the "License");
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * you may not use this file except in compliance with the License.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * You may obtain a copy of the License at
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Unless required by applicable law or agreed to in writing, software
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * distributed under the License is distributed on an "AS IS" BASIS,
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * See the License for the specific language governing permissions and
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * limitations under the License.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * logresolve 2.0
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Tom Rathborne - tomr uunet.ca - http://www.uunet.ca/~tomr/
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * UUNET Canada, April 16, 1995
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Rewritten by David Robinson. (drtr ast.cam.ac.uk)
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Rewritten again, and ported to APR by Colm MacCarthaigh
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Usage: logresolve [-s filename] [-c] < access_log > new_log
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Arguments:
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgun * -s filename name of a file to record statistics
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * -c check the DNS for a matching A record for the host.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Notes: (For historical interest)
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * To generate meaningful statistics from an HTTPD log file, it's good
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * to have the domain name of each machine that accessed your site, but
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * doing this on the fly can slow HTTPD down.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * Compiling NCSA HTTPD with the -DMINIMAL_DNS flag turns IP#->hostname
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * resolution off. Before running your stats program, just run your log
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * file through this program (logresolve) and all of your IP numbers will
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * be resolved into hostnames (where possible).
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * logresolve takes an HTTPD access log (in the COMMON log file format,
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * or any other format that has the IP number/domain name as the first
df92fac9baa2b098d654a59cb7b517e8ef6ed1f6nilgun * field for that matter), and outputs the same file with all of the
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * domain names looked up. Where no domain name can be found, the IP
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * number is left in.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * To minimize impact on your nameserver, logresolve has its very own
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * internal hash-table cache. This means that each IP number will only
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * be looked up the first time it is found in the log file.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * The -c option causes logresolve to apply the same check as httpd
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgun * compiled with -DMAXIMUM_DNS; after finding the hostname from the IP
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * address, it looks up the IP addresses for the hostname and checks
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * that one of these matches the original address.
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun/* Statistics */
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgunstatic int cachehits = 0;
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgunstatic int cachesize = 0;
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgunstatic int entries = 0;
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgunstatic int resolves = 0;
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgunstatic int withname = 0;
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgunstatic int doublefailed = 0;
0f8e51a88c016cac46e17ba4f298b58136fbfaf5nilgunstatic int noreverse = 0;
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * prints various statistics to output
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, "logresolve Statistics:" NL);
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, " With name : %d" NL, withname);
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, " Resolves : %d" NL, resolves);
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, " - Double lookup failed : %d" NL,
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, "Cache hits : %d" NL, cachehits);
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun apr_file_printf(output, "Cache size : %d" NL, cachesize);
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun * usage info
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgunstatic void usage(void)
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun "%s -- Resolve IP-addresses to hostnames in Apache log files." NL
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun " -s Record statistics to STATFILE when finished." NL
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun " -c Perform double lookups when resolving IP addresses." NL,
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun const char * arg;
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun#if APR_MAJOR_VERSION > 1 || (APR_MAJOR_VERSION == 1 && APR_MINOR_VERSION >= 3)
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun if (apr_app_initialize(&argc, &argv, NULL) != APR_SUCCESS) {
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun while (1) {
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun } /* switch */
c9b9246a20d2167ef0297bf7bf85ccaec84ac40fnilgun } /* else */
entries++;
withname++;
if (hostname) {
cachehits++;
withname++;
resolves++;
cachesize++;
noreverse++;
if (doublelookups) {
0, pool);
doublefailed++;
if (stats) {