mod_rewrite.c revision 5259ba24286df14fb89be643f234a4dc9613a071
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd/* ====================================================================
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * The Apache Software License, Version 1.1
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * Copyright (c) 2000-2003 The Apache Software Foundation. All rights
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * reserved.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * Redistribution and use in source and binary forms, with or without
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * modification, are permitted provided that the following conditions
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * are met:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * 1. Redistributions of source code must retain the above copyright
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * notice, this list of conditions and the following disclaimer.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * 2. Redistributions in binary form must reproduce the above copyright
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * notice, this list of conditions and the following disclaimer in
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * the documentation and/or other materials provided with the
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * distribution.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * 3. The end-user documentation included with the redistribution,
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * if any, must include the following acknowledgment:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * "This product includes software developed by the
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * Apache Software Foundation (http://www.apache.org/)."
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * Alternately, this acknowledgment may appear in the software itself,
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * if and wherever such third-party acknowledgments normally appear.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * 4. The names "Apache" and "Apache Software Foundation" must
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * not be used to endorse or promote products derived from this
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * software without prior written permission. For written
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * permission, please contact apache@apache.org.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * 5. Products derived from this software may not be called "Apache",
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * nor may "Apache" appear in their name, without prior written
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * permission of the Apache Software Foundation.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * SUCH DAMAGE.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * ====================================================================
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * This software consists of voluntary contributions made by many
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * individuals on behalf of the Apache Software Foundation. For more
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * information on the Apache Software Foundation, please see <http://www.apache.org/>.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * Portions of this software are based upon public domain software
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * originally written at the National Center for Supercomputing Applications,
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd * University of Illinois, Urbana-Champaign.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** _ __ ___ ___ __| | _ __ _____ ___ __(_) |_ ___
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** | '_ ` _ \ / _ \ / _` | | '__/ _ \ \ /\ / / '__| | __/ _ \
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** | | | | | | (_) | (_| | | | | __/\ V V /| | | | || __/
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** |_| |_| |_|\___/ \__,_|___|_| \___| \_/\_/ |_| |_|\__\___|
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** URL Rewriting Module
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** This module uses a rule-based rewriting engine (based on a
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** regular-expression parser) to rewrite requested URLs on the fly.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** It supports an unlimited number of additional rule conditions (which can
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** operate on a lot of variables, even on HTTP headers) for granular
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** matching and even external database lookups (either via plain text
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** tables, DBM hash files or even external processes) for advanced URL
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** substitution.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** It operates on the full URLs (including the PATH_INFO part) both in
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** per-server context (httpd.conf) and per-dir context (.htaccess) and even
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** can generate QUERY_STRING parts on result. The rewriting result finally
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** can lead to internal subprocessing, external request redirection or even
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** to internal proxy throughput.
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** This module was originally written in April 1996 and
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** gifted exclusively to The Apache Software Foundation in July 1997 by
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** Ralf S. Engelschall
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** rse@engelschall.com
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd#if !defined(OS2) && !defined(WIN32) && !defined(BEOS) && !defined(NETWARE)
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd#define MOD_REWRITE_SET_MUTEX_PERMS /* XXX Apache should define something */
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** +-------------------------------------------------------+
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** | static module configuration
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** +-------------------------------------------------------+
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** Our interface to the Apache server kernel:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** o Runtime logic of a request is as follows:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** while(request or subrequest)
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** foreach(stage #0...#9)
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** foreach(module) (**)
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** try to run hook
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** o the order of modules at (**) is the inverted order as
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** given in the "Configuration" file, i.e. the last module
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** specified is the first one called for each hook!
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** The core module is always the last!
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** o there are two different types of result checking and
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** continue processing:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** for hook #0,#1,#4,#5,#6,#8:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** hook run loop stops on the first module which gives
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** back a result != DECLINED, i.e. it usually returns OK
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** which says "OK, module has handled this _stage_" and for #1
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** this does not have to mean "Ok, the filename is now valid".
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** for hook #2,#3,#7,#9:
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** all hooks are run, independent of result
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** o at the last stage, the core module always
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** - says "HTTP_BAD_REQUEST" if r->filename does not begin with "/"
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** - prefixes the URL with document_root or replaces server_root
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** with document_root and sets r->filename
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** - always returns "OK" regardless of whether the file really exists
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd /* the module (predeclaration) */
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd /* rewritemap int: handler function registry */
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd /* the cache */
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd /* whether proxy module is available or not */
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bndstatic const char *lockname;
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bndstatic apr_global_mutex_t *rewrite_mapr_lock_acquire = NULL;
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** +-------------------------------------------------------+
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** | configuration directive handling
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** +-------------------------------------------------------+
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd** per-server configuration structure handling
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bndstatic void *config_server_create(apr_pool_t *p, server_rec *s)
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd a = (rewrite_server_conf *)apr_pcalloc(p, sizeof(rewrite_server_conf));
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd a->rewritemaps = apr_array_make(p, 2, sizeof(rewritemap_entry));
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd a->rewriteconds = apr_array_make(p, 2, sizeof(rewritecond_entry));
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd a->rewriterules = apr_array_make(p, 2, sizeof(rewriterule_entry));
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bnd return (void *)a;
8574d86b9ec3be36b7f54ed0547a0ee5d60dbd6bndstatic void *config_server_merge(apr_pool_t *p, void *basev, void *overridesv)
sizeof(rewrite_perdir_conf));
return NULL;
while (*option) {
if (limit <= 0) {
return NULL;
return NULL;
const char *a1)
return NULL;
const char *a2)
const char *ignored_fname;
int bad = 0;
if (colon) {
++bad;
++bad;
if (bad) {
return NULL;
const char *error;
return error;
if (!lockname) {
return NULL;
const char *a1)
return NULL;
const char *in_str)
char *a1;
char *a2;
char *a3;
char *cp;
const char *err;
int rc;
return err;
cp++;
== NULL);
if (rc) {
return NULL;
char *str)
char *cp;
char *cp1;
char *cp2;
char *cp3;
char *key;
char *val;
const char *err;
return err;
return NULL;
return NULL;
const char *in_str)
char *a1;
char *a2;
char *a3;
char *cp;
const char *err;
int mode;
return err;
cp++;
sizeof(rewritecond_entry));
sizeof(rewritecond_entry));
return NULL;
char *str)
char *cp;
char *cp1;
char *cp2;
char *cp3;
char *key;
char *val;
const char *err;
return err;
return NULL;
int status = 0;
if (i < MAX_ENV_FLAGS) {
if (i < MAX_COOKIE_FLAGS) {
return NULL;
if (map_pfn_register) {
return OK;
server_rec *s)
void *data;
int first_time = 0;
if (!data) {
return HTTP_INTERNAL_SERVER_ERROR;
#ifdef MOD_REWRITE_SET_MUTEX_PERMS
return HTTP_INTERNAL_SERVER_ERROR;
return HTTP_INTERNAL_SERVER_ERROR;
for (; s; s = s->next) {
open_rewritelog(s, p);
if (!first_time) {
return HTTP_INTERNAL_SERVER_ERROR;
return OK;
lockname, p);
const char *saved_rulestatus;
const char *var;
const char *thisserver;
char *thisport;
const char *thisurl;
const char *ccp;
unsigned int port;
int rulestatus;
return DECLINED;
return DECLINED;
r->filename);
if (rulestatus) {
unsigned skip;
if (!proxy_available) {
return HTTP_FORBIDDEN;
r->filename);
return OK;
if (r->args) {
? r->args
NULL);
n = r->status;
return HTTP_FORBIDDEN;
return HTTP_GONE;
return DECLINED;
#if APR_HAS_USER
return HTTP_BAD_REQUEST;
(r->filename +
r->filename);
return OK;
return DECLINED;
if (t == NULL) {
return DECLINED;
r->filename, t);
ap_set_content_type(r, t);
return OK;
char *cp;
char *cp2;
const char *ccp;
char *prefix;
int rulestatus;
char *ofilename;
return DECLINED;
return DECLINED;
return DECLINED;
* URL: http://localhost/foo and .htaccess is located in foo directory
if (r->filename &&
return DECLINED;
return DECLINED;
return HTTP_FORBIDDEN;
if (rulestatus) {
unsigned skip;
return OK;
* hostname and compare/substitute only the stuff after it.
if (r->args) {
? r->args
NULL);
n = r->status;
return HTTP_FORBIDDEN;
return HTTP_GONE;
return HTTP_BAD_REQUEST;
return OK;
r->filename+l);
return OK;
return DECLINED;
return DECLINED;
return DECLINED;
if (is_redirect_limit_exceeded(r)) {
return HTTP_INTERNAL_SERVER_ERROR;
return OK;
if (!reqc) {
char *perdir)
int changed;
int rc;
changed = 0;
loop:
p = &entries[i];
if (rc) {
goto loop;
if (p->skip > 0) {
s = p->skip;
p = &entries[i];
p = &entries[i];
return changed;
char *perdir)
char *uri;
char *output;
const char *vary;
int prefixstrip;
int failed;
int rc;
prefixstrip = 0;
sizeof(regmatch));
failed = 0;
c = &conds[i];
if (rc == 0) {
c = &conds[i];
if (rc == 0) {
if (failed) {
p->forced_mimetype);
reduce_uri(r);
r->filename);
p->forced_mimetype);
int rc;
rc = 0;
#if !defined(OS2)
sizeof(regmatch));
return rc;
inp++;
goto skip;
char *endp;
goto skip;
goto skip;
if (result) {
char *var;
span = 0;
skip:
space--;
char *olduri;
if (q != NULL) {
if (qsappend) {
r->filename);
char *cp;
unsigned short port;
char *portp;
char *hostp;
char *url;
char *olduri;
apr_size_t l;
c = *cp;
*cp = c;
const char *thisserver;
char *thisport;
int port;
switch (*uri++) {
char *cp;
return NULL;
++cp;
++cp;
NULL);
#if APR_HAS_USER
char *newuri;
char *homedir;
return newuri;
rewritemap_entry *s;
char *value;
s = &entries[i];
return NULL;
if ((value =
return value;
return NULL;
return NULL;
if ((value =
return value;
return NULL;
if ((value =
return value;
return value;
return NULL;
if ((value =
return NULL;
value);
return value;
return NULL;
char *cpT;
char *curkey;
char *curval;
return NULL;
if (skip == 0) {
++cpT;
if (skip == 0) {
return value;
return value;
#ifndef NO_WRITEV
return NULL;
if (rewrite_mapr_lock_acquire) {
#ifdef NO_WRITEV
buf[i++] = c;
if (rewrite_mapr_lock_acquire) {
return NULL;
cp++) {
return value;
cp++) {
return value;
char *value;
return value;
char *value;
return value;
static int rewrite_rand_init_done = 0;
static void rewrite_rand_init(void)
if (!rewrite_rand_init_done) {
static int rewrite_rand(int l, int h)
char *buf;
return value;
return buf;
const char *fname;
if (!fname) {
!= APR_SUCCESS) {
char *str1;
const char *type;
char *ruser;
const char *rhost;
(unsigned long)(r->server), (unsigned long)r,
return APR_SUCCESS;
APR_LOCK_DEFAULT, p);
return rc;
#ifdef MOD_REWRITE_SET_MUTEX_PERMS
return rc;
return APR_SUCCESS;
return APR_SUCCESS;
return APR_SUCCESS;
return rc;
return APR_SUCCESS;
const char *desc)
!= APR_SUCCESS) ||
procattr, p);
if (fpin) {
if (fpout) {
return (rc);
const char *result;
/* XXX: wow this has gotta be slow if you actually use it for a lot, recalculates exploded time for each variable */
return (char *)result; \
return NULL;
cache *c;
return NULL;
#if APR_HAS_THREADS
return NULL;
return NULL;
return NULL;
return n % CACHE_TLB_ROWS;
char *key)
for (i=0; i < CACHE_TLB_COLS; ++i) {
return NULL;
return &elt[j];
return NULL;
cacheentry *e)
cachelist *l;
cacheentry *e;
cachetlbentry *t;
int found_list;
#if APR_HAS_THREADS
found_list = 0;
if (e != NULL) {
#if APR_HAS_THREADS
#if APR_HAS_THREADS
if (!found_list) {
sizeof(cachetlbentry));
for (i=0; i<CACHE_TLB_ROWS; ++i) {
for (j=0; j<CACHE_TLB_COLS; ++j)
#if APR_HAS_THREADS
#if APR_HAS_THREADS
cachelist *l;
cacheentry *e;
#if APR_HAS_THREADS
if (e != NULL) {
#if APR_HAS_THREADS
#if APR_HAS_THREADS
#if APR_HAS_THREADS
return NULL;
const char *subst)
char *output;
return output;
char *cp;
int isquoted;
cp++; \
isquoted = 0; \
cp++; \
cp++; \
char *cp;
char *var;
char *val;
char *domain;
char *expires;
char *path;
char *tok_cntx;
char *cookie;
if (expires) {
char *notename;
void *data;
(expires)?
r->request_time +
: NULL,
NULL);
const char *root;
const char *slash;
char *statpath;
for (i = 0; i < n1; i++) {
int depth;
else if (*s == left) {
++depth;
return NULL;
int depth;
return NULL;
else if (*s == left) {
++depth;
return NULL;
{ NULL }