request.c revision b38846b15c8891c6dec44dcc4f96ca40721bf663
/* ====================================================================
* The Apache Software License, Version 1.1
*
* Copyright (c) 2000-2001 The Apache Software Foundation. All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
*
* 3. The end-user documentation included with the redistribution,
* if any, must include the following acknowledgment:
* "This product includes software developed by the
* Apache Software Foundation (http://www.apache.org/)."
* Alternately, this acknowledgment may appear in the software itself,
* if and wherever such third-party acknowledgments normally appear.
*
* 4. The names "Apache" and "Apache Software Foundation" must
* not be used to endorse or promote products derived from this
* software without prior written permission. For written
* permission, please contact apache@apache.org.
*
* 5. Products derived from this software may not be called "Apache",
* nor may "Apache" appear in their name, without prior written
* permission of the Apache Software Foundation.
*
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
* ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
* USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
* ====================================================================
*
* This software consists of voluntary contributions made by many
* individuals on behalf of the Apache Software Foundation. For more
* information on the Apache Software Foundation, please see
* <http://www.apache.org/>.
*
* Portions of this software are based upon public domain software
* originally written at the National Center for Supercomputing Applications,
* University of Illinois, Urbana-Champaign.
*/
/*
* http_request.c: functions to get and process requests
*
* Rob McCool 3/21/93
*
* Thoroughly revamped by rst for Apache. NB this file reads
* best from the bottom up.
*
*/
#include "apr_strings.h"
#include "apr_file_io.h"
#include "apr_fnmatch.h"
#define APR_WANT_STRFUNC
#include "apr_want.h"
#define CORE_PRIVATE
#include "ap_config.h"
#include "httpd.h"
#include "http_config.h"
#include "http_request.h"
#include "http_core.h"
#include "http_protocol.h"
#include "http_log.h"
#include "http_main.h"
#include "util_filter.h"
#include "util_charset.h"
#include "mod_core.h"
#include <stdarg.h>
#endif
)
(request_rec *r),(r),DECLINED)
(request_rec *r),(r),DECLINED)
(request_rec *r),(r),DECLINED)
(request_rec *r),(r),DECLINED)
/*****************************************************************
*
* Getting and checking directory configuration. Also checks the
* FollowSymlinks and FollowSymOwner stuff, since this is really the
* only place that can happen (barring a new mid_dir_walk callout).
*
* We can't do it as an access_checker module function which gets
* called with the final per_dir_config, since we could have a directory
* with FollowSymLinks disabled, which contains a symlink to another
* with a .htaccess file which turns FollowSymLinks back on --- and
* access in such a case must be denied. So, whatever it is that
* checks FollowSymLinks needs to know the state of the options as
* they change, all the way down.
*/
/*
* We don't want people able to serve up pipes, or unix sockets, or other
* scary things. Note that symlink tests are performed later.
*/
static int check_safe_file(request_rec *r)
{
/* NOTE(review): as it stands here, this body accepts every request
* unconditionally and never inspects r.  The log-message fragment and
* the HTTP_FORBIDDEN return that follow the closing brace look like the
* remainder of the intended file-type check -- confirm against the
* upstream revision before relying on this function.
*/
return OK;
}
"object is not a file, directory or symlink: %s",
r->filename);
return HTTP_FORBIDDEN;
}
{
#if defined(OS2)
/* OS/2 doesn't have symlinks */
return OK;
#else
char *lastp;
int res;
if (opts & OPT_SYM_LINKS)
return OK;
/*
* Strip trailing '/', if any, off what we're checking; trailing slashes
* make some systems follow symlinks to directories even in lstat().
* After we've done the lstat, put it back. Also, don't bother checking
* '/' at all...
*
* Note that we don't have to worry about multiple slashes here because of
* no2slash() below...
*/
if (lastp == d)
return OK; /* Root directory, '/' */
if (*lastp == '/')
*lastp = '\0';
else
if (lastp)
*lastp = '/';
/*
* Note that we don't reject accesses to nonexistent files (multiviews or
* the like may cons up a way to run the transaction anyway)...
*/
return OK;
/* OK, it's a symlink. May still be OK with OPT_SYM_OWNER */
if (!(opts & OPT_SYM_OWNER))
return HTTP_FORBIDDEN;
/* OPT_SYM_OWNER only works if we can get the owner from the file */
if (res != APR_SUCCESS)
return HTTP_FORBIDDEN;
return HTTP_FORBIDDEN;
/* TODO: replace with an apr_compare_users() fn */
#endif
}
/* Dealing with the file system to get PATH_INFO
*/
static int get_path_info(request_rec *r)
{
/* cp and rv are declared but not referenced before the return below. */
char *cp;
int rv;
#if defined(HAVE_DRIVE_LETTERS) || defined(HAVE_UNC_PATHS)
/* Flag that starts out set; it only exists on platforms with drive
* letters or UNC paths.  NOTE(review): presumably decides whether a
* trailing slash may be stripped -- confirm.
*/
char bStripSlash=1;
#endif
/* assume path_info already set */
/* NOTE(review): the visible body returns OK without inspecting r.  The
* statements after the closing brace appear to belong to this function;
* confirm against the upstream revision.
*/
return OK;
}
#ifdef HAVE_DRIVE_LETTERS
/* If the directory is x:\, then we don't want to strip
* the trailing slash since x: is not a valid directory.
*/
bStripSlash = 0;
#endif
#ifdef HAVE_UNC_PATHS
* advance over the trailing slash. Any other
* UNC name is OK to strip the slash.
*/
char *p;
int iCount=0;
p = path;
p++;
iCount++;
}
if (iCount == 4)
bStripSlash = 0;
}
#endif
#if defined(HAVE_DRIVE_LETTERS) || defined(HAVE_UNC_PATHS)
if (bStripSlash)
#endif
/* Advance over trailing slashes ... NOT part of filename
* if file is not a UNC name (Win32 only).
*/
continue;
/* See if the pathname ending here exists... */
*cp = '\0';
/* ### We no longer need the test ap_os_is_filename_valid() here
* since apr_stat isn't a posix thing - it's apr_stat's responsibility
* to handle whatever path string arrives at its door - by platform
* and volume restrictions as applicable...
* TODO: This code becomes even simpler if apr_stat grows
* an APR_PATHINCOMPLETE result to indicate that we are staring at
*/
*cp = '/';
/*
* Aha! Found something. If it was a directory, we will search
* contents of that directory for a multi_match, so the PATH_INFO
* argument starts with the component after that.
*/
}
*cp = '\0';
return OK;
}
continue;
--cp;
}
else {
if (APR_STATUS_IS_EACCES(rv))
"access to %s denied", r->uri);
else
"access to %s failed", r->uri);
return HTTP_FORBIDDEN;
}
}
return OK;
}
{
&core_module);
char *test_filename;
char *test_dirname;
int res;
unsigned i, num_dirs;
int j, test_filename_len;
#if defined(HAVE_UNC_PATHS) || defined(NETWARE)
unsigned iStart = 1;
#endif
/*
* Are we dealing with a file? If not, we can (hopefully) safely assume we
* have a handler that doesn't require one, but for safety's sake, and so
* we have something find_types() can get something out of, fake one. But
* don't run through the directory entries.
*/
return OK;
}
/*
* Go down the directory hierarchy. Where we have to check for symlinks,
* do so. Where a .htaccess file has permission to override anything,
* try to find one. If either of these things fails, we could poke
* around, see why, and adjust the lookup_rec accordingly --- this might
* save us a call to get_path_info (with the attendant stat()s); however,
* for the moment, that's not worth the trouble.
*
* Fake filenames (i.e. proxy:) only match Directory sections.
*/
if (!ap_os_is_path_absolute(r->filename))
{
const char *entry_dir;
for (j = 0; j < num_sec; ++j) {
entry_config = sec[j];
entry_dir = entry_core->d;
if (entry_core->r) {
}
else if (entry_core->d_is_fnmatch) {
}
if (this_conf)
}
return OK;
}
/* XXX This needs to be rolled into APR, the APR function will not
* be allowed to fold the case of any nonexistent segment of the path:
*/
/* TODO This is rather silly right here, we should simply be setting
* filename and path_info at the end of our directory_walk
*/
res = get_path_info(r);
return res;
}
/* XXX This becomes moot, and will already happen above for elements
* that actually exist:
*/
/* XXX This becomes moot, since the APR canonical parsing will handle
* 2slash and dot directory issues:
*/
/* XXX This needs to be rolled into APR: */
if ((res = check_safe_file(r))) {
return res;
}
--num_dirs;
++num_dirs;
/*
* We will use test_dirname as scratch space while we build directory
* names during the walk. Profiling shows directory_walk to be a busy
* function so we try to avoid allocating lots of extra memory here.
* We need 2 extra bytes, one for trailing \0 and one because
* make_dirstr_prefix will add potentially one extra /.
*/
/* XXX These exception cases go away if apr_stat() returns the
* APR_PATHINCOMPLETE status, so we skip hard filesystem testing
* of the initial 'pseudo' elements:
*/
#if defined(HAVE_UNC_PATHS)
/* If the name is a UNC name, then do not perform any true file test
* This is optimized to use the normal walk (skips the redundant '/' root)
*/
iStart = 4;
#endif
#if defined(NETWARE)
/* If the name is a fully qualified volume name, then do not perform any
* XXX: The implementation eludes me at this moment...
* Does this make sense? Please test!
*/
iStart = 2;
#endif
#if defined(HAVE_DRIVE_LETTERS) || defined(NETWARE)
/* Should match <Directory> sections starting from '/', not 'e:/'
* they have one for each filesystem. Traditionally, Apache has treated
* <Directory /> permissions as the base for the whole server, and this
* tradition should probably be preserved.
*
*/
if (test_filename[0] == '/')
i = 1;
else
i = 0;
#else
/* Normal File Systems are rooted at / */
i = 1;
#endif /* def HAVE_DRIVE_LETTERS || NETWARE */
/* j keeps track of which section we're on, see core_reorder_directories */
j = 0;
for (; i <= num_dirs; ++i) {
int overrides_here;
&core_module);
/*
* XXX: this could be made faster by only copying the next component
* rather than copying the entire thing all over.
*/
/*
* Do symlink checks first, because they are done with the
* permissions appropriate to the *parent* directory...
*/
#if defined(HAVE_UNC_PATHS) || defined(NETWARE)
/* Test only legal names against the real filesystem */
if (i >= iStart)
#endif
"Symbolic link not allowed: %s", test_dirname);
return res;
}
/*
* Begin *this* level by looking for matching <Directory> sections
* from access.conf.
*/
for (; j < num_sec; ++j) {
char *entry_dir;
entry_config = sec[j];
entry_dir = entry_core->d;
if (entry_core->r
#if defined(HAVE_DRIVE_LETTERS) || defined(NETWARE)
/* To account for the top-level "/" directory when i == 0
* XXX: The net test may be wrong... may fail ap_os_is_path_absolute
*/
&& entry_core->d_components > i)
#else
|| entry_core->d_components > i
#endif /* def HAVE_DRIVE_LETTERS || NETWARE */
)
break;
if (entry_core->d_is_fnmatch) {
}
}
if (this_conf) {
&core_module);
}
#if defined(HAVE_DRIVE_LETTERS) || defined(NETWARE)
/* So that other top-level directory sections (e.g. "e:/") aren't
* skipped when i == 0
* XXX: I don't get you here, Tim... That's a level 1 section, but
* we are at level 0. Did you mean fast-forward to the next?
*/
else if (!i)
break;
#endif /* def HAVE_DRIVE_LETTERS || NETWARE */
}
/* If .htaccess files are enabled, check for one. */
#if defined(HAVE_UNC_PATHS) || defined(NETWARE)
/* Test only legal names against the real filesystem */
if (i >= iStart)
#endif
if (overrides_here) {
sconf->access_name);
if (res)
return res;
if (htaccess_conf) {
}
}
}
/*
* There are two types of IS_SPECIAL sections (see http_core.c), and we've
* already handled the proxy:-style stuff. Now we'll deal with the
* regexes.
*/
for (; j < num_sec; ++j) {
entry_config = sec[j];
if (entry_core->r) {
}
}
}
/*
* Symlink permissions are determined by the parent. If the request is
* for a directory then applying the symlink test here would use the
* permissions of the directory as opposed to its parent. Consider a
* symlink pointing to a dir with a .htaccess disallowing symlinks. If
* you access /symlink (or /symlink/) you would get a 403 without this
* S_ISDIR test. But if you accessed /symlink/index.html, for example,
* you would *not* get the 403.
*/
"Symbolic link not allowed: %s", r->filename);
return res;
}
return OK; /* Can only "fail" if access denied by the
* symlink goop. */
}
{
&core_module);
char *test_location;
char *entry_url;
int j;
if (!num_url) {
return OK;
}
/* Location and LocationMatch differ on their behaviour w.r.t. multiple
* slashes. Location matches multiple slashes with a single slash,
* LocationMatch doesn't. An exception, for backwards brokenness is
* absoluteURIs... in which case neither match multiple slashes.
*/
if (r->uri[0] != '/') {
test_location = r->uri;
}
else {
}
/* Go through the location entries, and check for matches. */
/* we apply the directive sections in some order;
* should really try them with the most general first.
*/
for (j = 0; j < num_url; ++j) {
entry_config = url[j];
entry_url = entry_core->d;
if (entry_core->r) {
}
else if (entry_core->d_is_fnmatch) {
}
}
if (this_conf)
}
return OK;
}
{
&core_module);
char *test_file;
/* get the basename */
}
else {
++test_file;
}
/* Go through the file entries, and check for matches. */
if (num_files) {
char *entry_file;
int j;
/* we apply the directive sections in some order;
* should really try them with the most general first.
*/
for (j = 0; j < num_files; ++j) {
entry_config = file[j];
entry_file = entry_core->d;
if (entry_core->r) {
}
else if (entry_core->d_is_fnmatch) {
}
}
}
if (this_conf)
}
}
return OK;
}
/*****************************************************************
*
* The sub_request mechanism.
*
* Fns to look up a relative URI from, e.g., a map file or SSI document.
* These do all access checks, etc., but don't actually run the transaction
* ... use run_sub_req below for that. Also, be sure to use destroy_sub_req
* as appropriate if you're likely to be creating more than a few of these.
* (An early Apache version didn't destroy the sub_reqs used in directory
* indexing. The result, when indexing a directory with 800-odd files in
* it, was massively excessive storage allocation).
*
* Note more manipulation of protocol-specific vars in the request
* structure...
*/
{
return rr;
}
{
if (APR_BUCKET_IS_EOS(e)) {
}
return APR_SUCCESS;
}
{
/* Is there a require line configured for the type of *this* req? */
int i;
if (!reqs_arr)
return 0;
return 1;
return 0;
}
const char *new_file,
const request_rec *r,
{
int res;
char *udir;
rnew = make_sub_request(r);
/* make a copy of the allowed-methods list */
/* start with the same set of output filters */
if (next_filter) {
}
else {
}
/* no input filters for a subrequest */
/* would be nicer to pass "method" to ap_set_sub_req_protocol */
if (new_file[0] == '/')
else {
}
if (res) {
return rnew;
}
return rnew;
}
if (res) {
return rnew;
}
/*
* We could be clever at this point, and avoid calling directory_walk,
* etc. However, we'd need to test that the old and new filenames contain
* the same directory components, so it would require duplicating the
* start of translate_name. Instead we rely on the cache of .htaccess
* results.
*
* NB: directory_walk() clears the per_dir_config, so we don't inherit
* from location_walk() above
*/
&& (!ap_some_auth_required(rnew)
)
) {
}
return rnew;
}
const request_rec *r,
{
}
const request_rec *r,
{
int res;
char *fdir;
rnew = make_sub_request(r);
/* make a copy of the allowed-methods list */
/* start with the same set of output filters */
if (next_filter) {
}
else {
}
/* no input filters for a subrequest */
/*
* Check for a special case... if there are no '/' characters in new_file
* at all, then we are looking at a relative lookup in the same
* directory. That means we won't have to redo directory_walk, and we may
* not even have to redo access checks.
*/
&& (rv != APR_INCOMPLETE)) {
}
return rnew;
}
/*
* no matter what, if it's a subdirectory, we need to re-run
* directory_walk
*/
if (!res) {
}
}
else {
return rnew;
}
/*
* do a file_walk, if it doesn't change the per_dir_config then
* we know that we don't have to redo all the access checks
*/
return rnew;
}
}
return rnew;
}
}
}
else {
/* XXX: @@@: What should be done with the parsed_uri values? */
/*
* XXX: this should be set properly like it is in the same-dir case
* but it's actually sometimes impossible to do it... because the
* file may not have a uri associated with it -djg
*/
if (!res) {
}
}
if (res
&& (!ap_some_auth_required(rnew)
)
) {
}
return rnew;
}
{
int retval;
/* see comments in process_request_internal() */
retval = ap_invoke_handler(r);
return retval;
}
{
/* Reclaim the space */
apr_pool_destroy(r->pool);
}
/*
* Function to set the r->mtime field to the specified value if it's later
* than what's already there.
*/
{
if (r->mtime < dependency_mtime) {
r->mtime = dependency_mtime;
}
}
/*
* Is it the initial main request, which we only get *once* per HTTP request?
*/
{
return
&&
}